diff --git a/.gitattributes b/.gitattributes index c7d9f3332a950355d5a77d85000f05e6f45435ea..463557ab2ca226e0eb475b488049813ff7df114c 100644 --- a/.gitattributes +++ b/.gitattributes @@ -32,3 +32,51 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text *.zip filter=lfs diff=lfs merge=lfs -text *.zst filter=lfs diff=lfs merge=lfs -text *tfevents* filter=lfs diff=lfs merge=lfs -text +8b7178b44b/evaluation/generation/examples.8b7178b44b_GEM-wiki_lingua_en_tldr_en_0.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b44b/evaluation/generation/examples.8b7178b44b_gem_xsum_article_DOC_summary_3.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b88b/evaluation/generation/examples.8b7178b88b_GEM-web_nlg_en_PALM_prompt_1.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b88b/evaluation/generation/examples.8b7178b88b_GEM-wiki_lingua_en_tldr_en_5.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b88b/evaluation/generation/examples.8b7178b88b_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b44b/evaluation/generation/examples.8b7178b44b_GEM-wiki_lingua_en_tldr_en_5.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b44b/evaluation/generation/examples.8b7178b44b_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b44b/evaluation/generation/examples.8b7178b44b_gem_xsum_article_DOC_summary_2.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b88b/evaluation/generation/examples.8b7178b88b_GEM-wiki_lingua_en_tldr_en_0.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b88b/evaluation/generation/examples.8b7178b88b_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b88b/evaluation/generation/examples.8b7178b88b_gem_xsum_article_DOC_summary_2.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b44b/evaluation/generation/examples.8b7178b44b_GEM-web_nlg_en_PALM_prompt_3.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b44b/evaluation/generation/examples.8b7178b44b_GEM-web_nlg_en_PALM_prompt_4.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b44b/evaluation/generation/examples.8b7178b44b_GEM-web_nlg_en_PALM_prompt_5.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b44b/evaluation/generation/examples.8b7178b44b_GEM-wiki_lingua_en_tldr_en_3.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b44b/evaluation/generation/examples.8b7178b44b_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b88b/evaluation/generation/examples.8b7178b88b_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b44b/evaluation/generation/examples.8b7178b44b_GEM-web_nlg_en_PALM_prompt_0.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b44b/evaluation/generation/examples.8b7178b44b_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b88b/evaluation/generation/examples.8b7178b88b_GEM-web_nlg_en_PALM_prompt_2.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b88b/evaluation/generation/examples.8b7178b88b_GEM-wiki_lingua_en_tldr_en_3.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b88b/evaluation/generation/examples.8b7178b88b_gem_xsum_article_DOC_summary_3.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b44b/evaluation/generation/examples.8b7178b44b_GEM-web_nlg_en_PALM_prompt_1.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b44b/evaluation/generation/examples.8b7178b44b_gem_xsum_article_DOC_summary_5.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b88b/evaluation/generation/examples.8b7178b88b_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b88b/evaluation/generation/examples.8b7178b88b_gem_xsum_article_DOC_summary_0.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b44b/evaluation/generation/examples.8b7178b44b_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b44b/evaluation/generation/examples.8b7178b44b_gem_xsum_article_DOC_summary_4.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b88b/evaluation/generation/examples.8b7178b88b_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b88b/evaluation/generation/examples.8b7178b88b_gem_xsum_article_DOC_summary_1.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b88b/evaluation/generation/examples.8b7178b88b_GEM-wiki_lingua_en_tldr_en_1.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b88b/evaluation/generation/examples.8b7178b88b_GEM-wiki_lingua_en_tldr_en_2.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b44b/evaluation/generation/examples.8b7178b44b_GEM-wiki_lingua_en_tldr_en_4.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b44b/evaluation/generation/examples.8b7178b44b_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b44b/evaluation/generation/examples.8b7178b44b_gem_xsum_article_DOC_summary_1.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b88b/evaluation/generation/examples.8b7178b88b_GEM-web_nlg_en_PALM_prompt_3.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b88b/evaluation/generation/examples.8b7178b88b_GEM-web_nlg_en_PALM_prompt_4.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b88b/evaluation/generation/examples.8b7178b88b_GEM-web_nlg_en_PALM_prompt_5.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b88b/evaluation/generation/examples.8b7178b88b_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b88b/evaluation/generation/examples.8b7178b88b_gem_xsum_article_DOC_summary_4.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b88b/evaluation/generation/examples.8b7178b88b_GEM-wiki_lingua_en_tldr_en_4.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b88b/evaluation/generation/examples.8b7178b88b_gem_xsum_article_DOC_summary_5.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b44b/evaluation/generation/examples.8b7178b44b_GEM-web_nlg_en_PALM_prompt_2.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b44b/evaluation/generation/examples.8b7178b44b_GEM-wiki_lingua_en_tldr_en_1.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b44b/evaluation/generation/examples.8b7178b44b_GEM-wiki_lingua_en_tldr_en_2.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b44b/evaluation/generation/examples.8b7178b44b_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b44b/evaluation/generation/examples.8b7178b44b_gem_xsum_article_DOC_summary_0.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b88b/evaluation/generation/examples.8b7178b88b_GEM-web_nlg_en_PALM_prompt_0.jsonl filter=lfs diff=lfs merge=lfs -text diff --git a/8b7178b44b/evaluation/generation/agg.8b7178b44b_GEM-web_nlg_en_PALM_prompt_0.json b/8b7178b44b/evaluation/generation/agg.8b7178b44b_GEM-web_nlg_en_PALM_prompt_0.json new file mode 100644 index 0000000000000000000000000000000000000000..fe25d06bc8fadad4eede133a4df6140d766ac7bf --- /dev/null +++ b/8b7178b44b/evaluation/generation/agg.8b7178b44b_GEM-web_nlg_en_PALM_prompt_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.4712440224858371, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.041795896662364315}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.08494278433659254, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.002682014199464667}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.3010315100774798, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.005434382926718196}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.11420475482093911, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0022183305831393195}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.03708415721222578, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0015055606328312114}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.14224175280721357, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0032367826210838984}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.051776101353314175, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0012810666933093713}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.07986488274116094, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0025364066921602967}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.2851084703862567, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.005103727035204417}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.10723944522759159, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.002017538602140417}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.08031203138023377, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0025700547990470703}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.2832049885841092, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.00501983173550152}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.10754705129811067, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002066923006506901}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b44b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b44b/evaluation/generation/agg.8b7178b44b_GEM-web_nlg_en_PALM_prompt_1.json b/8b7178b44b/evaluation/generation/agg.8b7178b44b_GEM-web_nlg_en_PALM_prompt_1.json new file mode 100644 index 0000000000000000000000000000000000000000..915d34a365dbe6bcff1c0a6608ff228821757b61 --- /dev/null +++ b/8b7178b44b/evaluation/generation/agg.8b7178b44b_GEM-web_nlg_en_PALM_prompt_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.6352422858353469, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.04386319262846487}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.14729082149250516, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.004315116801617204}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.34501701041772753, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004883560454809294}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.17595828606649466, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0037103128590180736}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.0749912603946425, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0029697645981284103}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.17507177387031794, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0035680879509635034}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.08797235452625987, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.002563800160615811}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.13087012462145003, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0037359089786958557}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.3214469196295103, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004518231473535444}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.1587241385605771, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0031813191221144485}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.13443162008077075, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0038480943977239573}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.32447309188867546, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0044995663315275155}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.16209364614512511, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.003268839028418146}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b44b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b44b/evaluation/generation/agg.8b7178b44b_GEM-web_nlg_en_PALM_prompt_2.json b/8b7178b44b/evaluation/generation/agg.8b7178b44b_GEM-web_nlg_en_PALM_prompt_2.json new file mode 100644 index 0000000000000000000000000000000000000000..4361c4bd406056deaca414d58e242281bba6a389 --- /dev/null +++ b/8b7178b44b/evaluation/generation/agg.8b7178b44b_GEM-web_nlg_en_PALM_prompt_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.9195810919624675, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.04315216107683015}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.19281853446958125, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.005348179657635172}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.3839239693259562, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004896794421772872}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.21485950562026987, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.004330200790716057}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.1059225294754287, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0036916446521448806}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.20457409251843786, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0037775743582373947}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.11382579286837109, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0029731216918058084}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.16888883147055286, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.00457575327708451}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.35302151670878984, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004443535122018173}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.1905777152487244, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0036266046372882984}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.17526191475368208, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.004769580382692894}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.35984651407202956, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004507478564774203}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.1966781681343204, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0037869984327305512}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b44b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b44b/evaluation/generation/agg.8b7178b44b_GEM-web_nlg_en_PALM_prompt_3.json b/8b7178b44b/evaluation/generation/agg.8b7178b44b_GEM-web_nlg_en_PALM_prompt_3.json new file mode 100644 index 0000000000000000000000000000000000000000..18b6e7a76babd31912845236c3fbff3a44bd2c96 --- /dev/null +++ b/8b7178b44b/evaluation/generation/agg.8b7178b44b_GEM-web_nlg_en_PALM_prompt_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 1.0349566025343735, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.03887674612290353}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.20438835211537978, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.005665805208271208}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.39198992418866246, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004947498335222262}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.2237082219543607, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.004572034500678942}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.11365499071190853, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.00397252439813096}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.2111302605559281, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.003926393767113415}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.1207306381621409, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.003262380279344123}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.17756713475764335, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.004833439612735641}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.3583014136638203, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004476979554028604}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.196789710556852, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0038281461566836554}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.18556820599751273, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.00508629808674153}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.3664900622762122, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004561176586485258}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.20416935580581227, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.004021347054930177}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b44b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b44b/evaluation/generation/agg.8b7178b44b_GEM-web_nlg_en_PALM_prompt_4.json b/8b7178b44b/evaluation/generation/agg.8b7178b44b_GEM-web_nlg_en_PALM_prompt_4.json new file mode 100644 index 0000000000000000000000000000000000000000..c822c5de8bb890a428b4221e70fa6a48b1ee03c8 --- /dev/null +++ b/8b7178b44b/evaluation/generation/agg.8b7178b44b_GEM-web_nlg_en_PALM_prompt_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 1.1673998473534046, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.09133948510400369}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.2125195111528658, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.005730453983133926}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.40637639113635166, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004933922377880338}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.23196338111553216, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.004558457306896048}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.11875092253811664, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0039714331213516595}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.22248575515884728, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.004014145150661029}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.12559736589051002, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.003188817274548042}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.1843607825179914, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0048800492055134925}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.370665372766866, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004464677380992271}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.2038615706419507, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.003812860468542949}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.19370515184964268, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.005184788234116766}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.3806829975264072, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004583640895651089}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.2125920854603434, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.004058013873763605}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b44b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b44b/evaluation/generation/agg.8b7178b44b_GEM-web_nlg_en_PALM_prompt_5.json b/8b7178b44b/evaluation/generation/agg.8b7178b44b_GEM-web_nlg_en_PALM_prompt_5.json new file mode 100644 index 0000000000000000000000000000000000000000..1ea762b5c4b8397aa789ed176a92725431f0ad6c --- /dev/null +++ b/8b7178b44b/evaluation/generation/agg.8b7178b44b_GEM-web_nlg_en_PALM_prompt_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 1.194760741144373, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.09038400286323779}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.22388107728965712, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0058375878448932725}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.41258053843820386, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004808891702805189}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.24067238350377898, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.004627635578763758}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.12470779957706617, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.004011608962377894}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.22396081182592556, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.003932938864761309}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.12988590207293185, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.003239297680717399}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.19195297464964095, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.004914089701123312}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.37374160359881364, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.00433847098671097}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.20930811896578502, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0038259333936250185}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.20275170487892208, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.005253109590732199}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.3844755575959121, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004448663215506157}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.21923266732565286, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.004087600756703223}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b44b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b44b/evaluation/generation/agg.8b7178b44b_GEM-wiki_lingua_en_tldr_en_0.json b/8b7178b44b/evaluation/generation/agg.8b7178b44b_GEM-wiki_lingua_en_tldr_en_0.json new file mode 100644 index 0000000000000000000000000000000000000000..bda8a9d0efd61925504b7e7bc993ba26ece35cab --- /dev/null +++ b/8b7178b44b/evaluation/generation/agg.8b7178b44b_GEM-wiki_lingua_en_tldr_en_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.11259234653795358, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0032411862971363117}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.14340893843595093, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0034694907773717048}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.10762579083182928, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0025835076322910672}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.02582999428983234, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0010000072112516562}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.03784241933814092, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.001450453403192633}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.02778920003491775, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.000982242456017776}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.08841484558766141, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0027853934411114305}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.1114317644839379, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0027453844256091257}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.08192620888873649, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0019339948879164794}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.1068082984161991, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0031424461382987463}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.13490305217744453, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0032803950524800847}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.10120163014874665, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002435237757238233}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 2.170472303270534, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.09245843828343826}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b44b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b44b/evaluation/generation/agg.8b7178b44b_GEM-wiki_lingua_en_tldr_en_1.json b/8b7178b44b/evaluation/generation/agg.8b7178b44b_GEM-wiki_lingua_en_tldr_en_1.json new file mode 100644 index 0000000000000000000000000000000000000000..f8a39132295bf07932cd1de47009aa1cfc1356a8 --- /dev/null +++ b/8b7178b44b/evaluation/generation/agg.8b7178b44b_GEM-wiki_lingua_en_tldr_en_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.19504169763237164, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.003161655570483573}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.2268980166797919, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.00336143207911689}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.18153788588353004, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002424482153914544}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.049740220187040864, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.001561722025312558}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.05782059703115125, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0016860297998920056}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.044909001327117046, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0011943824375694858}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.14594590659077963, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.002476347943750222}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.1691189101402509, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002588936970621776}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.1341843957584949, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0017857657209747223}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.18281924229155466, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0029977938731759806}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.21164415433278383, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0031361900114708872}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.16951014920125493, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0022640636265336893}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 3.020335174960559, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.06787715772935045}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b44b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b44b/evaluation/generation/agg.8b7178b44b_e2e_nlg_cleaned_generate_text_restaurant_0.json b/8b7178b44b/evaluation/generation/agg.8b7178b44b_e2e_nlg_cleaned_generate_text_restaurant_0.json new file mode 100644 index 0000000000000000000000000000000000000000..510c35824b9ed7e149ae1df2d6efbff0a3d96c70 --- /dev/null +++ b/8b7178b44b/evaluation/generation/agg.8b7178b44b_e2e_nlg_cleaned_generate_text_restaurant_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 2.235702101845383, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.14717774293969751}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.7622052797070503, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.006647669795578922}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.1532954300944369, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0031267049368978316}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.18121867050334917, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0018474922816842606}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.7122733552799622, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.007806658717987775}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.07189313722539607, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0017250469433453682}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.08752141617950068, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0010542837911429734}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.7500255707124592, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.006889071529543362}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.13882842661597, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0025055451424711027}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.1698326390033901, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0014973431260616968}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.752191135927755, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.00685154752320934}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.14346581040848494, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002891637286051436}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.17261995880897366, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0016987141071618745}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b44b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b44b/evaluation/generation/agg.8b7178b44b_e2e_nlg_cleaned_generate_text_restaurant_1.json b/8b7178b44b/evaluation/generation/agg.8b7178b44b_e2e_nlg_cleaned_generate_text_restaurant_1.json new file mode 100644 index 0000000000000000000000000000000000000000..b1bbafb727033c7814d799b6f43e7fb170715130 --- /dev/null +++ b/8b7178b44b/evaluation/generation/agg.8b7178b44b_e2e_nlg_cleaned_generate_text_restaurant_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 12.507959373818647, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.12774308491764494}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.5901037503482837, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0032159724501758416}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.4453954075758376, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0030647232677422412}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.48125855004986695, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0023747652067436864}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.2860806077756621, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0027716337523015977}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.21297260057374331, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002224122053216537}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.23034576083422903, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0020975083120057516}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.4308357021587011, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.003009420690844223}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.3212543906087175, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002480078078958591}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.34846752107389445, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0021243881165946155}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.4830396285828985, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.003213107569523447}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.3634977467417529, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002819214726631758}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.3931631455827191, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0023981333184838593}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b44b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b44b/evaluation/generation/agg.8b7178b44b_e2e_nlg_cleaned_generate_text_restaurant_2.json b/8b7178b44b/evaluation/generation/agg.8b7178b44b_e2e_nlg_cleaned_generate_text_restaurant_2.json new file mode 100644 index 0000000000000000000000000000000000000000..8c9440baa2566d1cd2c952b17eac56b0c15a78ed --- /dev/null +++ b/8b7178b44b/evaluation/generation/agg.8b7178b44b_e2e_nlg_cleaned_generate_text_restaurant_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 15.158653678134238, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.11217626725691181}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.6066145287034505, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.003147539042422012}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.48239587619310037, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0029532891322940407}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.5131292320126455, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002253031761361406}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.3089787427206784, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0028203707876968153}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.24188957715036025, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002292974031208558}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.2578530121604481, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0021628607938910917}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.44560511468454206, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.002995038040318342}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.35193582043955735, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0025196283655795136}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.37525966202827027, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0021725307399361672}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.5064590234844139, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.003190583549175626}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.4026845079975637, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002836627735824717}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.4285131129511556, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0024045780604980463}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b44b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b44b/evaluation/generation/agg.8b7178b44b_e2e_nlg_cleaned_generate_text_restaurant_3.json b/8b7178b44b/evaluation/generation/agg.8b7178b44b_e2e_nlg_cleaned_generate_text_restaurant_3.json new file mode 100644 index 0000000000000000000000000000000000000000..eadb478e30b95939cc2a8ffccfbf9a24171d7c66 --- /dev/null +++ b/8b7178b44b/evaluation/generation/agg.8b7178b44b_e2e_nlg_cleaned_generate_text_restaurant_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 15.759812537730546, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.16130432495289687}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.6077270325813979, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0031150320109689183}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.49124527491366843, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0029113142559981263}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.5204784544081206, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002251275712244091}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.31332017254120853, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0027772905192189512}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.2502643652420692, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0023315173133087275}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.26545692823299993, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0021835553197599713}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.4459205694292829, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0029361567575171836}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.3592970906286205, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0025375120589350396}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.3810216920994399, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.002194042986121944}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.5082193147554575, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.003142597202698407}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.41160458845561226, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002840955053130549}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.4357908055166842, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0024150704709467426}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b44b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b44b/evaluation/generation/agg.8b7178b44b_e2e_nlg_cleaned_generate_text_restaurant_4.json b/8b7178b44b/evaluation/generation/agg.8b7178b44b_e2e_nlg_cleaned_generate_text_restaurant_4.json new file mode 100644 index 0000000000000000000000000000000000000000..919ee51a442811fa883e231fd870c2b9fc5eb83b --- /dev/null +++ b/8b7178b44b/evaluation/generation/agg.8b7178b44b_e2e_nlg_cleaned_generate_text_restaurant_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 16.134799256710256, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.1070119918698532}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.6054119860771526, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0031401965578103136}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.4946565816842518, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0028364911596105765}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.523909375920506, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0022880595790812155}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.3124961122227526, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.002808954903697186}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.25220130152340275, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0023493523906758557}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.26757332273287654, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0022434333099258102}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.44233843950127705, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0029306698549013154}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.3607369273273119, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002523691933961996}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.382175935620986, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.002236237383536334}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.5057660051353207, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.003153645376968123}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.4139501510871044, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002788136076678763}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.4381722454639816, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0024443106668905357}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b44b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b44b/evaluation/generation/agg.8b7178b44b_e2e_nlg_cleaned_generate_text_restaurant_5.json b/8b7178b44b/evaluation/generation/agg.8b7178b44b_e2e_nlg_cleaned_generate_text_restaurant_5.json new file mode 100644 index 0000000000000000000000000000000000000000..ed015e5184fb4f361a3aba186eb8b83bbb0937f5 --- /dev/null +++ b/8b7178b44b/evaluation/generation/agg.8b7178b44b_e2e_nlg_cleaned_generate_text_restaurant_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 16.107165763126492, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.1725403495293288}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.6037882438302521, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.00307437348704947}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.49496382545882733, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0027753751046680057}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.5240001141378704, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0022053636458810423}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.31296117294303094, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0027976539566726744}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.25262525126987617, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0023072545439166217}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.26817812765923393, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.002197626024453061}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.44434419215812615, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.002949180064465491}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.3625276939571968, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0024933568400759844}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.3843695820781079, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0022098458849370652}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.5068534628215157, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0031588710330076797}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.41448240798432473, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0027203178472831524}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.4393845856350276, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002395852175826684}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b44b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b44b/evaluation/generation/agg.8b7178b44b_gem_xsum_article_DOC_summary_0.json b/8b7178b44b/evaluation/generation/agg.8b7178b44b_gem_xsum_article_DOC_summary_0.json new file mode 100644 index 0000000000000000000000000000000000000000..727ec92cb08ef1370a51f3f5e0e5879a180d510b --- /dev/null +++ b/8b7178b44b/evaluation/generation/agg.8b7178b44b_gem_xsum_article_DOC_summary_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.1554932484923166, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.002221691062513405}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.35841398237522276, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004880460975300627}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.2131475561803473, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002809398976147748}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.036146559262545196, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0012086761533876766}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.08868762877243597, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0030835154047321074}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.05062634534913608, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.001690768330530915}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.11383026012975615, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.001748646718497343}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.2638855275835188, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0038587410761858755}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.15595658881556435, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.002127497880378741}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.12373439304630478, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0019078089158618033}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.2868552037024372, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004272131408381669}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.16967238254142056, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.00237624607133809}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 2.1587870129118882, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.09029922216218629}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b44b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b44b/evaluation/generation/agg.8b7178b44b_gem_xsum_article_DOC_summary_1.json b/8b7178b44b/evaluation/generation/agg.8b7178b44b_gem_xsum_article_DOC_summary_1.json new file mode 100644 index 0000000000000000000000000000000000000000..4e69fd76f7d6fca32ec4030e836acb373fdd509f --- /dev/null +++ b/8b7178b44b/evaluation/generation/agg.8b7178b44b_gem_xsum_article_DOC_summary_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.17602273459783957, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0034912567740095035}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.2978672198691626, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004325712043489534}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.20475174329785, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0030292857270426262}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.04044850363752258, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0019137570100629107}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.06884979773351274, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002724070824860895}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.046694043648379924, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.001891957305961457}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.13694272638916472, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0028412360369673493}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.2334897227634632, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.003556590427451311}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.1593397594005996, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0024118116760541847}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.137142234387202, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0029073893715640745}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.23357550407307784, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.003728086289055363}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.15946764140405875, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0025141424269190023}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 1.9813214649410344, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.06605541875330423}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b44b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b44b/evaluation/generation/agg.8b7178b44b_gem_xsum_article_DOC_summary_2.json b/8b7178b44b/evaluation/generation/agg.8b7178b44b_gem_xsum_article_DOC_summary_2.json new file mode 100644 index 0000000000000000000000000000000000000000..7817591016a5e6fe179032c07bf20cd1544f3cc3 --- /dev/null +++ b/8b7178b44b/evaluation/generation/agg.8b7178b44b_gem_xsum_article_DOC_summary_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.2229374260378376, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.004280928411283304}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.28304069580526636, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.003972947611177992}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.2303304665083427, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.003468001334593542}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.057639208977718646, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.002614759341604805}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.06850665995022794, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0026514610571335023}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.05750919277461529, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.002337201303458201}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.17219483167439611, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.003538412807763811}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.21973513766849492, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0033149507650464807}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.17795352717964225, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0028890194692426686}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.17313600638730706, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0035630889990072444}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.2218290481310322, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0034301100563963126}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.17909978174756772, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002921283919599673}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 2.568315279137756, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.13888090668923836}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b44b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b44b/evaluation/generation/examples.8b7178b44b_GEM-web_nlg_en_PALM_prompt_0.jsonl b/8b7178b44b/evaluation/generation/examples.8b7178b44b_GEM-web_nlg_en_PALM_prompt_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..b4aa8af95c5bc2d60843866b6b49483970c7fe4f --- /dev/null +++ b/8b7178b44b/evaluation/generation/examples.8b7178b44b_GEM-web_nlg_en_PALM_prompt_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8339addbfc0b2ede94cb25dc11238a81aaa21283f2803bd36f6486b2d5e6404c +size 3866795 diff --git a/8b7178b44b/evaluation/generation/examples.8b7178b44b_GEM-web_nlg_en_PALM_prompt_1.jsonl b/8b7178b44b/evaluation/generation/examples.8b7178b44b_GEM-web_nlg_en_PALM_prompt_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..815fe295b2eb19d9da0b6ca6d557dda479a1ccc5 --- /dev/null +++ b/8b7178b44b/evaluation/generation/examples.8b7178b44b_GEM-web_nlg_en_PALM_prompt_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f6382e0a51d013e467a7cfbdeb8fbec4c6e8db7e6678bf0920293c65e978abfe +size 4691205 diff --git a/8b7178b44b/evaluation/generation/examples.8b7178b44b_GEM-web_nlg_en_PALM_prompt_2.jsonl b/8b7178b44b/evaluation/generation/examples.8b7178b44b_GEM-web_nlg_en_PALM_prompt_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..7a7c55e99092ab0512cff916efd6befc8623a27e --- /dev/null +++ b/8b7178b44b/evaluation/generation/examples.8b7178b44b_GEM-web_nlg_en_PALM_prompt_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fabd8518b73485027526b64535a66a8e0750aa0849fdbb065c2e98a6c67aa320 +size 5521059 diff --git a/8b7178b44b/evaluation/generation/examples.8b7178b44b_GEM-web_nlg_en_PALM_prompt_3.jsonl b/8b7178b44b/evaluation/generation/examples.8b7178b44b_GEM-web_nlg_en_PALM_prompt_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..73cfc63b1e925b5cb152bb22cea00eeb539434e6 --- /dev/null +++ b/8b7178b44b/evaluation/generation/examples.8b7178b44b_GEM-web_nlg_en_PALM_prompt_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b5dd6afcaa7477faf4a44fca98f6b7f79553046f8575c0f707d4e4c12229744 +size 6425484 diff --git a/8b7178b44b/evaluation/generation/examples.8b7178b44b_GEM-web_nlg_en_PALM_prompt_4.jsonl b/8b7178b44b/evaluation/generation/examples.8b7178b44b_GEM-web_nlg_en_PALM_prompt_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..d5dfcd374b3e41c66fc2e0b9069bb91d25746f4d --- /dev/null +++ b/8b7178b44b/evaluation/generation/examples.8b7178b44b_GEM-web_nlg_en_PALM_prompt_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:783b978aacceeb440353f7237c4e5c9ecc63ea0b9eb291bcc38dd19aeff2bb39 +size 7316949 diff --git a/8b7178b44b/evaluation/generation/examples.8b7178b44b_GEM-web_nlg_en_PALM_prompt_5.jsonl b/8b7178b44b/evaluation/generation/examples.8b7178b44b_GEM-web_nlg_en_PALM_prompt_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..7c023ab02018f08095abfbb3c44b0dd9f9cefe08 --- /dev/null +++ b/8b7178b44b/evaluation/generation/examples.8b7178b44b_GEM-web_nlg_en_PALM_prompt_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d424024c7212898f66db28844f617a72480e72fb2379ca3a337c27f0c00e6031 +size 8202195 diff --git a/8b7178b44b/evaluation/generation/examples.8b7178b44b_GEM-wiki_lingua_en_tldr_en_0.jsonl b/8b7178b44b/evaluation/generation/examples.8b7178b44b_GEM-wiki_lingua_en_tldr_en_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..6989fe1cda7bba3cfc45b1b91989d255f3952993 --- /dev/null +++ b/8b7178b44b/evaluation/generation/examples.8b7178b44b_GEM-wiki_lingua_en_tldr_en_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74405f30b53bd6d76c62783114bb60edb313d93fc34483bd2e72c589a9c62cb2 +size 7250720 diff --git a/8b7178b44b/evaluation/generation/examples.8b7178b44b_GEM-wiki_lingua_en_tldr_en_1.jsonl b/8b7178b44b/evaluation/generation/examples.8b7178b44b_GEM-wiki_lingua_en_tldr_en_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..17d7bc23d07fd05d519711eb6c1615d7bfa382f0 --- /dev/null +++ b/8b7178b44b/evaluation/generation/examples.8b7178b44b_GEM-wiki_lingua_en_tldr_en_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:313b14011f3e26d22574a478f82fb992167a2d98a1a63b14cd53ebf3ceec101e +size 13040072 diff --git a/8b7178b44b/evaluation/generation/examples.8b7178b44b_GEM-wiki_lingua_en_tldr_en_2.jsonl b/8b7178b44b/evaluation/generation/examples.8b7178b44b_GEM-wiki_lingua_en_tldr_en_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/8b7178b44b/evaluation/generation/examples.8b7178b44b_GEM-wiki_lingua_en_tldr_en_3.jsonl b/8b7178b44b/evaluation/generation/examples.8b7178b44b_GEM-wiki_lingua_en_tldr_en_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/8b7178b44b/evaluation/generation/examples.8b7178b44b_GEM-wiki_lingua_en_tldr_en_4.jsonl b/8b7178b44b/evaluation/generation/examples.8b7178b44b_GEM-wiki_lingua_en_tldr_en_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/8b7178b44b/evaluation/generation/examples.8b7178b44b_GEM-wiki_lingua_en_tldr_en_5.jsonl b/8b7178b44b/evaluation/generation/examples.8b7178b44b_GEM-wiki_lingua_en_tldr_en_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/8b7178b44b/evaluation/generation/examples.8b7178b44b_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl b/8b7178b44b/evaluation/generation/examples.8b7178b44b_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..f11605977142b34869604e2fa3935f4f873d3b67 --- /dev/null +++ b/8b7178b44b/evaluation/generation/examples.8b7178b44b_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:69e4d23880302237ccf33e401b7517581aa16962ca935ec633f0c47ea6bd5b8d +size 3787869 diff --git a/8b7178b44b/evaluation/generation/examples.8b7178b44b_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl b/8b7178b44b/evaluation/generation/examples.8b7178b44b_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..ef995a459be5447e11df68d0ef9d35b3902c0b4b --- /dev/null +++ b/8b7178b44b/evaluation/generation/examples.8b7178b44b_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1399558ecce70df4bf20714cbb51dcbea1044ce6fd2024ddde5261048397f651 +size 4994557 diff --git a/8b7178b44b/evaluation/generation/examples.8b7178b44b_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl b/8b7178b44b/evaluation/generation/examples.8b7178b44b_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..8093ba0c8d7b56f4b53f12bf8d2633259ff5e05e --- /dev/null +++ b/8b7178b44b/evaluation/generation/examples.8b7178b44b_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b56ec148302a38265fe42b1ae6affc50e64b965006940315d1d4fcf0b859550c +size 6092875 diff --git a/8b7178b44b/evaluation/generation/examples.8b7178b44b_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl b/8b7178b44b/evaluation/generation/examples.8b7178b44b_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e9f16f651f1a7f74caf56e26c1c1d25dcbb443cd --- /dev/null +++ b/8b7178b44b/evaluation/generation/examples.8b7178b44b_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39ea06fcb170a3d6bb9812808bdccbb16c93ca0da1609e35d1f70fa0e931d067 +size 7177725 diff --git a/8b7178b44b/evaluation/generation/examples.8b7178b44b_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl b/8b7178b44b/evaluation/generation/examples.8b7178b44b_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..4c57bf24e04bd58b4773217bcfef5d65c4aa467c --- /dev/null +++ b/8b7178b44b/evaluation/generation/examples.8b7178b44b_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:81034bd11be74be75f8958c567d13cdfd98a67af0630fde5212f0f71a3c3cb96 +size 8258693 diff --git a/8b7178b44b/evaluation/generation/examples.8b7178b44b_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl b/8b7178b44b/evaluation/generation/examples.8b7178b44b_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..79005c51d17639627568b9345862a4e74e3cf22b --- /dev/null +++ b/8b7178b44b/evaluation/generation/examples.8b7178b44b_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d105c01293042b025be040e49eb923792bdd813c868adf51b2e135fa6916252a +size 9345579 diff --git a/8b7178b44b/evaluation/generation/examples.8b7178b44b_gem_xsum_article_DOC_summary_0.jsonl b/8b7178b44b/evaluation/generation/examples.8b7178b44b_gem_xsum_article_DOC_summary_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..05082fcf49b41cc93e8e9174162a47b0401b64d6 --- /dev/null +++ b/8b7178b44b/evaluation/generation/examples.8b7178b44b_gem_xsum_article_DOC_summary_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7873d0adacd52a5c6095631bae0a34012b3dcae266f57054b8befef8c688c84b +size 2806869 diff --git a/8b7178b44b/evaluation/generation/examples.8b7178b44b_gem_xsum_article_DOC_summary_1.jsonl b/8b7178b44b/evaluation/generation/examples.8b7178b44b_gem_xsum_article_DOC_summary_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..9eb6df5f8546fc34f61df096a5e9e9ae54844300 --- /dev/null +++ b/8b7178b44b/evaluation/generation/examples.8b7178b44b_gem_xsum_article_DOC_summary_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f0d9292cc62b21da242e84e535547c30b9161725d6c92c3a60631a06b0642093 +size 5031838 diff --git a/8b7178b44b/evaluation/generation/examples.8b7178b44b_gem_xsum_article_DOC_summary_2.jsonl b/8b7178b44b/evaluation/generation/examples.8b7178b44b_gem_xsum_article_DOC_summary_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..c002555cfb666e30762a4cb47d501b2a495b878c --- /dev/null +++ b/8b7178b44b/evaluation/generation/examples.8b7178b44b_gem_xsum_article_DOC_summary_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf53cc1d1b0b36b1400ad34fe1ab33d165a9b0183df5b603a5abe07b87ce3f3e +size 7247412 diff --git a/8b7178b44b/evaluation/generation/examples.8b7178b44b_gem_xsum_article_DOC_summary_3.jsonl b/8b7178b44b/evaluation/generation/examples.8b7178b44b_gem_xsum_article_DOC_summary_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/8b7178b44b/evaluation/generation/examples.8b7178b44b_gem_xsum_article_DOC_summary_4.jsonl b/8b7178b44b/evaluation/generation/examples.8b7178b44b_gem_xsum_article_DOC_summary_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/8b7178b44b/evaluation/generation/examples.8b7178b44b_gem_xsum_article_DOC_summary_5.jsonl b/8b7178b44b/evaluation/generation/examples.8b7178b44b_gem_xsum_article_DOC_summary_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/8b7178b44b/evaluation/generation/slim.8b7178b44b_GEM-web_nlg_en_PALM_prompt_0.json b/8b7178b44b/evaluation/generation/slim.8b7178b44b_GEM-web_nlg_en_PALM_prompt_0.json new file mode 100644 index 0000000000000000000000000000000000000000..cca955149642143f37f0a94ef4ae6b3e725e228b --- /dev/null +++ b/8b7178b44b/evaluation/generation/slim.8b7178b44b_GEM-web_nlg_en_PALM_prompt_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.4712440224858371, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.041795896662364315 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.08494278433659254, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.002682014199464667 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.3010315100774798, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.005434382926718196 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.11420475482093911, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0022183305831393195 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.03708415721222578, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0015055606328312114 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.14224175280721357, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0032367826210838984 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.051776101353314175, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0012810666933093713 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.07986488274116094, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0025364066921602967 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.2851084703862567, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.005103727035204417 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.10723944522759159, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.002017538602140417 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.08031203138023377, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0025700547990470703 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.2832049885841092, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.00501983173550152 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.10754705129811067, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.002066923006506901 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b44b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b44b/evaluation/generation/slim.8b7178b44b_GEM-web_nlg_en_PALM_prompt_1.json b/8b7178b44b/evaluation/generation/slim.8b7178b44b_GEM-web_nlg_en_PALM_prompt_1.json new file mode 100644 index 0000000000000000000000000000000000000000..6bb2db7ad6d4c966140edce53a479d379154d837 --- /dev/null +++ b/8b7178b44b/evaluation/generation/slim.8b7178b44b_GEM-web_nlg_en_PALM_prompt_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.6352422858353469, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.04386319262846487 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.14729082149250516, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.004315116801617204 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.34501701041772753, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.004883560454809294 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.17595828606649466, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0037103128590180736 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.0749912603946425, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0029697645981284103 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.17507177387031794, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0035680879509635034 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.08797235452625987, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.002563800160615811 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.13087012462145003, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0037359089786958557 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.3214469196295103, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004518231473535444 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.1587241385605771, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0031813191221144485 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.13443162008077075, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0038480943977239573 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.32447309188867546, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0044995663315275155 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.16209364614512511, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.003268839028418146 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b44b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b44b/evaluation/generation/slim.8b7178b44b_GEM-web_nlg_en_PALM_prompt_2.json b/8b7178b44b/evaluation/generation/slim.8b7178b44b_GEM-web_nlg_en_PALM_prompt_2.json new file mode 100644 index 0000000000000000000000000000000000000000..d2b7c738c26f21d6455ee889a86eee1d60aca25f --- /dev/null +++ b/8b7178b44b/evaluation/generation/slim.8b7178b44b_GEM-web_nlg_en_PALM_prompt_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.9195810919624675, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.04315216107683015 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.19281853446958125, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.005348179657635172 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.3839239693259562, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.004896794421772872 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.21485950562026987, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.004330200790716057 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.1059225294754287, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0036916446521448806 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.20457409251843786, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0037775743582373947 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.11382579286837109, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0029731216918058084 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.16888883147055286, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.00457575327708451 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.35302151670878984, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004443535122018173 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.1905777152487244, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0036266046372882984 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.17526191475368208, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.004769580382692894 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.35984651407202956, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004507478564774203 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.1966781681343204, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0037869984327305512 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b44b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b44b/evaluation/generation/slim.8b7178b44b_GEM-web_nlg_en_PALM_prompt_3.json b/8b7178b44b/evaluation/generation/slim.8b7178b44b_GEM-web_nlg_en_PALM_prompt_3.json new file mode 100644 index 0000000000000000000000000000000000000000..847cbdbf6263ae42ab751901812420ef8a087874 --- /dev/null +++ b/8b7178b44b/evaluation/generation/slim.8b7178b44b_GEM-web_nlg_en_PALM_prompt_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 1.0349566025343735, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.03887674612290353 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.20438835211537978, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.005665805208271208 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.39198992418866246, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.004947498335222262 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.2237082219543607, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.004572034500678942 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.11365499071190853, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.00397252439813096 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.2111302605559281, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.003926393767113415 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.1207306381621409, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.003262380279344123 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.17756713475764335, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.004833439612735641 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.3583014136638203, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004476979554028604 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.196789710556852, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0038281461566836554 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.18556820599751273, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.00508629808674153 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.3664900622762122, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004561176586485258 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.20416935580581227, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.004021347054930177 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b44b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b44b/evaluation/generation/slim.8b7178b44b_GEM-web_nlg_en_PALM_prompt_4.json b/8b7178b44b/evaluation/generation/slim.8b7178b44b_GEM-web_nlg_en_PALM_prompt_4.json new file mode 100644 index 0000000000000000000000000000000000000000..33b0dca8116cb7945cde79c0b13d6307fbb3509c --- /dev/null +++ b/8b7178b44b/evaluation/generation/slim.8b7178b44b_GEM-web_nlg_en_PALM_prompt_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 1.1673998473534046, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.09133948510400369 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.2125195111528658, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.005730453983133926 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.40637639113635166, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.004933922377880338 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.23196338111553216, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.004558457306896048 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.11875092253811664, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0039714331213516595 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.22248575515884728, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.004014145150661029 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.12559736589051002, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.003188817274548042 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.1843607825179914, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0048800492055134925 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.370665372766866, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004464677380992271 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.2038615706419507, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.003812860468542949 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.19370515184964268, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.005184788234116766 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.3806829975264072, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004583640895651089 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.2125920854603434, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.004058013873763605 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b44b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b44b/evaluation/generation/slim.8b7178b44b_GEM-web_nlg_en_PALM_prompt_5.json b/8b7178b44b/evaluation/generation/slim.8b7178b44b_GEM-web_nlg_en_PALM_prompt_5.json new file mode 100644 index 0000000000000000000000000000000000000000..6c32a40e5d7161063e8c3acd753b5119a95b38c7 --- /dev/null +++ b/8b7178b44b/evaluation/generation/slim.8b7178b44b_GEM-web_nlg_en_PALM_prompt_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 1.194760741144373, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.09038400286323779 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.22388107728965712, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0058375878448932725 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.41258053843820386, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.004808891702805189 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.24067238350377898, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.004627635578763758 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.12470779957706617, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.004011608962377894 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.22396081182592556, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.003932938864761309 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.12988590207293185, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.003239297680717399 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.19195297464964095, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.004914089701123312 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.37374160359881364, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.00433847098671097 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.20930811896578502, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0038259333936250185 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.20275170487892208, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.005253109590732199 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.3844755575959121, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004448663215506157 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.21923266732565286, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.004087600756703223 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b44b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b44b/evaluation/generation/slim.8b7178b44b_GEM-wiki_lingua_en_tldr_en_0.json b/8b7178b44b/evaluation/generation/slim.8b7178b44b_GEM-wiki_lingua_en_tldr_en_0.json new file mode 100644 index 0000000000000000000000000000000000000000..9e144be5d37b5d75d75bafe906b7a4dedfe413ed --- /dev/null +++ b/8b7178b44b/evaluation/generation/slim.8b7178b44b_GEM-wiki_lingua_en_tldr_en_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.11259234653795358, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0032411862971363117 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.14340893843595093, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0034694907773717048 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.10762579083182928, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0025835076322910672 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.02582999428983234, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0010000072112516562 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.03784241933814092, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.001450453403192633 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.02778920003491775, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.000982242456017776 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.08841484558766141, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0027853934411114305 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.1114317644839379, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0027453844256091257 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.08192620888873649, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0019339948879164794 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.1068082984161991, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0031424461382987463 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.13490305217744453, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0032803950524800847 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.10120163014874665, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.002435237757238233 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 2.170472303270534, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.09245843828343826 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b44b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b44b/evaluation/generation/slim.8b7178b44b_GEM-wiki_lingua_en_tldr_en_1.json b/8b7178b44b/evaluation/generation/slim.8b7178b44b_GEM-wiki_lingua_en_tldr_en_1.json new file mode 100644 index 0000000000000000000000000000000000000000..1d4ac20eae549ceffecaaaf2a064b63fb7b60c15 --- /dev/null +++ b/8b7178b44b/evaluation/generation/slim.8b7178b44b_GEM-wiki_lingua_en_tldr_en_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.19504169763237164, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.003161655570483573 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.2268980166797919, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.00336143207911689 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.18153788588353004, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.002424482153914544 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.049740220187040864, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.001561722025312558 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.05782059703115125, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0016860297998920056 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.044909001327117046, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0011943824375694858 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.14594590659077963, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.002476347943750222 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.1691189101402509, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.002588936970621776 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.1341843957584949, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0017857657209747223 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.18281924229155466, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0029977938731759806 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.21164415433278383, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0031361900114708872 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.16951014920125493, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0022640636265336893 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 3.020335174960559, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.06787715772935045 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b44b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b44b/evaluation/generation/slim.8b7178b44b_e2e_nlg_cleaned_generate_text_restaurant_0.json b/8b7178b44b/evaluation/generation/slim.8b7178b44b_e2e_nlg_cleaned_generate_text_restaurant_0.json new file mode 100644 index 0000000000000000000000000000000000000000..19839fde4f93fdc94cb6b8af4e79f1215cfefab4 --- /dev/null +++ b/8b7178b44b/evaluation/generation/slim.8b7178b44b_e2e_nlg_cleaned_generate_text_restaurant_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 2.235702101845383, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.14717774293969751 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.7622052797070503, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.006647669795578922 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.1532954300944369, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0031267049368978316 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.18121867050334917, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0018474922816842606 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.7122733552799622, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.007806658717987775 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.07189313722539607, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0017250469433453682 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.08752141617950068, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0010542837911429734 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.7500255707124592, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.006889071529543362 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.13882842661597, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0025055451424711027 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.1698326390033901, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0014973431260616968 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.752191135927755, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.00685154752320934 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.14346581040848494, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.002891637286051436 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.17261995880897366, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0016987141071618745 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b44b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b44b/evaluation/generation/slim.8b7178b44b_e2e_nlg_cleaned_generate_text_restaurant_1.json b/8b7178b44b/evaluation/generation/slim.8b7178b44b_e2e_nlg_cleaned_generate_text_restaurant_1.json new file mode 100644 index 0000000000000000000000000000000000000000..8eb1cfe1d822cb671fbc674458feeacad1f375c3 --- /dev/null +++ b/8b7178b44b/evaluation/generation/slim.8b7178b44b_e2e_nlg_cleaned_generate_text_restaurant_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 12.507959373818647, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.12774308491764494 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.5901037503482837, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0032159724501758416 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.4453954075758376, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0030647232677422412 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.48125855004986695, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0023747652067436864 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.2860806077756621, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0027716337523015977 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.21297260057374331, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.002224122053216537 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.23034576083422903, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0020975083120057516 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.4308357021587011, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.003009420690844223 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.3212543906087175, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.002480078078958591 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.34846752107389445, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0021243881165946155 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.4830396285828985, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.003213107569523447 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.3634977467417529, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.002819214726631758 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.3931631455827191, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0023981333184838593 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b44b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b44b/evaluation/generation/slim.8b7178b44b_e2e_nlg_cleaned_generate_text_restaurant_2.json b/8b7178b44b/evaluation/generation/slim.8b7178b44b_e2e_nlg_cleaned_generate_text_restaurant_2.json new file mode 100644 index 0000000000000000000000000000000000000000..d16cb90808f1b622e7f7d258c359765e16b18923 --- /dev/null +++ b/8b7178b44b/evaluation/generation/slim.8b7178b44b_e2e_nlg_cleaned_generate_text_restaurant_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 15.158653678134238, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.11217626725691181 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.6066145287034505, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.003147539042422012 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.48239587619310037, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0029532891322940407 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.5131292320126455, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.002253031761361406 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.3089787427206784, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0028203707876968153 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.24188957715036025, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.002292974031208558 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.2578530121604481, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0021628607938910917 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.44560511468454206, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.002995038040318342 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.35193582043955735, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0025196283655795136 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.37525966202827027, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0021725307399361672 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.5064590234844139, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.003190583549175626 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.4026845079975637, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.002836627735824717 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.4285131129511556, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0024045780604980463 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b44b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b44b/evaluation/generation/slim.8b7178b44b_e2e_nlg_cleaned_generate_text_restaurant_3.json b/8b7178b44b/evaluation/generation/slim.8b7178b44b_e2e_nlg_cleaned_generate_text_restaurant_3.json new file mode 100644 index 0000000000000000000000000000000000000000..8e2383a84609bc69a674919f4696e851132864d0 --- /dev/null +++ b/8b7178b44b/evaluation/generation/slim.8b7178b44b_e2e_nlg_cleaned_generate_text_restaurant_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 15.759812537730546, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.16130432495289687 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.6077270325813979, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0031150320109689183 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.49124527491366843, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0029113142559981263 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.5204784544081206, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.002251275712244091 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.31332017254120853, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0027772905192189512 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.2502643652420692, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0023315173133087275 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.26545692823299993, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0021835553197599713 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.4459205694292829, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0029361567575171836 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.3592970906286205, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0025375120589350396 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.3810216920994399, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.002194042986121944 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.5082193147554575, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.003142597202698407 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.41160458845561226, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.002840955053130549 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.4357908055166842, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0024150704709467426 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b44b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b44b/evaluation/generation/slim.8b7178b44b_e2e_nlg_cleaned_generate_text_restaurant_4.json b/8b7178b44b/evaluation/generation/slim.8b7178b44b_e2e_nlg_cleaned_generate_text_restaurant_4.json new file mode 100644 index 0000000000000000000000000000000000000000..7eb5dc7b0d4f109806f11f2352f113766a5b9808 --- /dev/null +++ b/8b7178b44b/evaluation/generation/slim.8b7178b44b_e2e_nlg_cleaned_generate_text_restaurant_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 16.134799256710256, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.1070119918698532 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.6054119860771526, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0031401965578103136 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.4946565816842518, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0028364911596105765 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.523909375920506, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0022880595790812155 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.3124961122227526, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.002808954903697186 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.25220130152340275, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0023493523906758557 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.26757332273287654, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0022434333099258102 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.44233843950127705, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0029306698549013154 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.3607369273273119, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.002523691933961996 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.382175935620986, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.002236237383536334 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.5057660051353207, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.003153645376968123 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.4139501510871044, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.002788136076678763 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.4381722454639816, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0024443106668905357 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b44b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b44b/evaluation/generation/slim.8b7178b44b_e2e_nlg_cleaned_generate_text_restaurant_5.json b/8b7178b44b/evaluation/generation/slim.8b7178b44b_e2e_nlg_cleaned_generate_text_restaurant_5.json new file mode 100644 index 0000000000000000000000000000000000000000..830b8143c5c35377cf8a5785ef22e7da4bd2f526 --- /dev/null +++ b/8b7178b44b/evaluation/generation/slim.8b7178b44b_e2e_nlg_cleaned_generate_text_restaurant_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 16.107165763126492, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.1725403495293288 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.6037882438302521, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.00307437348704947 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.49496382545882733, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0027753751046680057 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.5240001141378704, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0022053636458810423 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.31296117294303094, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0027976539566726744 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.25262525126987617, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0023072545439166217 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.26817812765923393, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.002197626024453061 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.44434419215812615, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.002949180064465491 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.3625276939571968, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0024933568400759844 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.3843695820781079, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0022098458849370652 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.5068534628215157, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0031588710330076797 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.41448240798432473, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0027203178472831524 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.4393845856350276, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.002395852175826684 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b44b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b44b/evaluation/generation/slim.8b7178b44b_gem_xsum_article_DOC_summary_0.json b/8b7178b44b/evaluation/generation/slim.8b7178b44b_gem_xsum_article_DOC_summary_0.json new file mode 100644 index 0000000000000000000000000000000000000000..a4d33a805e1bb90bddfb7db86c697560be2eb6e2 --- /dev/null +++ b/8b7178b44b/evaluation/generation/slim.8b7178b44b_gem_xsum_article_DOC_summary_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.1554932484923166, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.002221691062513405 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.35841398237522276, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.004880460975300627 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.2131475561803473, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.002809398976147748 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.036146559262545196, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0012086761533876766 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.08868762877243597, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0030835154047321074 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.05062634534913608, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.001690768330530915 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.11383026012975615, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.001748646718497343 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.2638855275835188, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0038587410761858755 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.15595658881556435, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.002127497880378741 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.12373439304630478, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0019078089158618033 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.2868552037024372, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.004272131408381669 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.16967238254142056, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.00237624607133809 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 2.1587870129118882, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.09029922216218629 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b44b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b44b/evaluation/generation/slim.8b7178b44b_gem_xsum_article_DOC_summary_1.json b/8b7178b44b/evaluation/generation/slim.8b7178b44b_gem_xsum_article_DOC_summary_1.json new file mode 100644 index 0000000000000000000000000000000000000000..46413c20b6c3b00347a56441a04240d85191f36c --- /dev/null +++ b/8b7178b44b/evaluation/generation/slim.8b7178b44b_gem_xsum_article_DOC_summary_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.17602273459783957, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0034912567740095035 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.2978672198691626, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.004325712043489534 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.20475174329785, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0030292857270426262 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.04044850363752258, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0019137570100629107 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.06884979773351274, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.002724070824860895 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.046694043648379924, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.001891957305961457 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.13694272638916472, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0028412360369673493 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.2334897227634632, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.003556590427451311 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.1593397594005996, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0024118116760541847 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.137142234387202, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0029073893715640745 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.23357550407307784, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.003728086289055363 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.15946764140405875, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0025141424269190023 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 1.9813214649410344, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.06605541875330423 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b44b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b44b/evaluation/generation/slim.8b7178b44b_gem_xsum_article_DOC_summary_2.json b/8b7178b44b/evaluation/generation/slim.8b7178b44b_gem_xsum_article_DOC_summary_2.json new file mode 100644 index 0000000000000000000000000000000000000000..544abe718ed8b84dadf656d06caa57affba8fc30 --- /dev/null +++ b/8b7178b44b/evaluation/generation/slim.8b7178b44b_gem_xsum_article_DOC_summary_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.2229374260378376, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.004280928411283304 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.28304069580526636, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.003972947611177992 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.2303304665083427, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.003468001334593542 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.057639208977718646, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.002614759341604805 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.06850665995022794, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0026514610571335023 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.05750919277461529, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.002337201303458201 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.17219483167439611, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.003538412807763811 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.21973513766849492, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0033149507650464807 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.17795352717964225, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0028890194692426686 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.17313600638730706, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0035630889990072444 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.2218290481310322, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0034301100563963126 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.17909978174756772, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.002921283919599673 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 2.568315279137756, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.13888090668923836 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b44b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b44b/evaluation/rankeval/8b7178b44b_0.json b/8b7178b44b/evaluation/rankeval/8b7178b44b_0.json new file mode 100644 index 0000000000000000000000000000000000000000..8c6a7781dd9f40cf0e232ad1af316afc35d6f82b --- /dev/null +++ b/8b7178b44b/evaluation/rankeval/8b7178b44b_0.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.35, + "acc_stderr": 0.015090650341444235 + }, + "anli_r2": { + "acc": 0.339, + "acc_stderr": 0.014976758771620339 + }, + "anli_r3": { + "acc": 0.3566666666666667, + "acc_stderr": 0.013833742805050713 + }, + "cb": { + "acc": 0.375, + "acc_stderr": 0.06527912098338669, + "f1": 0.2631578947368421 + }, + "copa": { + "acc": 0.76, + "acc_stderr": 0.04292346959909283 + }, + "hellaswag": { + "acc": 0.4500099581756622, + "acc_stderr": 0.004964779805180658, + "acc_norm": 0.5825532762397929, + "acc_norm_stderr": 0.00492130033128556 + }, + "rte": { + "acc": 0.5126353790613718, + "acc_stderr": 0.030086851767188564 + }, + "winogrande": { + "acc": 0.5509076558800315, + "acc_stderr": 0.013979459389140844 + }, + "storycloze_2016": { + "acc": 0.7006948156066275, + "acc_stderr": 0.010590117252248801 + }, + "boolq": { + "acc": 0.5651376146788991, + "acc_stderr": 0.008670528471841557 + }, + "arc_easy": { + "acc": 0.5917508417508418, + "acc_stderr": 0.01008556619579125, + "acc_norm": 0.5340909090909091, + "acc_norm_stderr": 0.010235908103438688 + }, + "arc_challenge": { + "acc": 0.2440273037542662, + "acc_stderr": 0.012551447627856259, + "acc_norm": 0.2883959044368601, + "acc_norm_stderr": 0.013238394422428175 + }, + "sciq": { + "acc": 0.857, + "acc_stderr": 0.01107581480856704, + "acc_norm": 0.769, + "acc_norm_stderr": 0.013334797216936442 + }, + "piqa": { + "acc": 0.7366702937976061, + "acc_stderr": 0.010276185322196764, + "acc_norm": 0.7464635473340587, + "acc_norm_stderr": 0.010150090834551794 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/8b7178b44b/evaluation/rankeval/8b7178b44b_0_lm-eval_global_step84877_2023-01-31-11-38-06_0shots_backup.json b/8b7178b44b/evaluation/rankeval/8b7178b44b_0_lm-eval_global_step84877_2023-01-31-11-38-06_0shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..8c6a7781dd9f40cf0e232ad1af316afc35d6f82b --- /dev/null +++ b/8b7178b44b/evaluation/rankeval/8b7178b44b_0_lm-eval_global_step84877_2023-01-31-11-38-06_0shots_backup.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.35, + "acc_stderr": 0.015090650341444235 + }, + "anli_r2": { + "acc": 0.339, + "acc_stderr": 0.014976758771620339 + }, + "anli_r3": { + "acc": 0.3566666666666667, + "acc_stderr": 0.013833742805050713 + }, + "cb": { + "acc": 0.375, + "acc_stderr": 0.06527912098338669, + "f1": 0.2631578947368421 + }, + "copa": { + "acc": 0.76, + "acc_stderr": 0.04292346959909283 + }, + "hellaswag": { + "acc": 0.4500099581756622, + "acc_stderr": 0.004964779805180658, + "acc_norm": 0.5825532762397929, + "acc_norm_stderr": 0.00492130033128556 + }, + "rte": { + "acc": 0.5126353790613718, + "acc_stderr": 0.030086851767188564 + }, + "winogrande": { + "acc": 0.5509076558800315, + "acc_stderr": 0.013979459389140844 + }, + "storycloze_2016": { + "acc": 0.7006948156066275, + "acc_stderr": 0.010590117252248801 + }, + "boolq": { + "acc": 0.5651376146788991, + "acc_stderr": 0.008670528471841557 + }, + "arc_easy": { + "acc": 0.5917508417508418, + "acc_stderr": 0.01008556619579125, + "acc_norm": 0.5340909090909091, + "acc_norm_stderr": 0.010235908103438688 + }, + "arc_challenge": { + "acc": 0.2440273037542662, + "acc_stderr": 0.012551447627856259, + "acc_norm": 0.2883959044368601, + "acc_norm_stderr": 0.013238394422428175 + }, + "sciq": { + "acc": 0.857, + "acc_stderr": 0.01107581480856704, + "acc_norm": 0.769, + "acc_norm_stderr": 0.013334797216936442 + }, + "piqa": { + "acc": 0.7366702937976061, + "acc_stderr": 0.010276185322196764, + "acc_norm": 0.7464635473340587, + "acc_norm_stderr": 0.010150090834551794 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/8b7178b44b/evaluation/rankeval/8b7178b44b_1.json b/8b7178b44b/evaluation/rankeval/8b7178b44b_1.json new file mode 100644 index 0000000000000000000000000000000000000000..22895b1470b1d8a5e1c51035d987d2018e89f9d9 --- /dev/null +++ b/8b7178b44b/evaluation/rankeval/8b7178b44b_1.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.313, + "acc_stderr": 0.014671272822977885 + }, + "anli_r2": { + "acc": 0.325, + "acc_stderr": 0.014818724459095527 + }, + "anli_r3": { + "acc": 0.3491666666666667, + "acc_stderr": 0.01376707539507725 + }, + "cb": { + "acc": 0.4107142857142857, + "acc_stderr": 0.0663363415035954, + "f1": 0.2576489533011272 + }, + "copa": { + "acc": 0.79, + "acc_stderr": 0.040936018074033256 + }, + "hellaswag": { + "acc": 0.45200159330810596, + "acc_stderr": 0.004966736811010493, + "acc_norm": 0.5935072694682334, + "acc_norm_stderr": 0.004901747426331751 + }, + "rte": { + "acc": 0.516245487364621, + "acc_stderr": 0.030080573208738064 + }, + "winogrande": { + "acc": 0.5666929755327546, + "acc_stderr": 0.01392691505275734 + }, + "storycloze_2016": { + "acc": 0.6953500801710315, + "acc_stderr": 0.0106434269886468 + }, + "boolq": { + "acc": 0.618348623853211, + "acc_stderr": 0.008496550741178254 + }, + "arc_easy": { + "acc": 0.6346801346801347, + "acc_stderr": 0.009880576614806928, + "acc_norm": 0.6254208754208754, + "acc_norm_stderr": 0.009931758820410629 + }, + "arc_challenge": { + "acc": 0.2764505119453925, + "acc_stderr": 0.013069662474252425, + "acc_norm": 0.2986348122866894, + "acc_norm_stderr": 0.013374078615068752 + }, + "sciq": { + "acc": 0.898, + "acc_stderr": 0.009575368801653892, + "acc_norm": 0.902, + "acc_norm_stderr": 0.009406619184621228 + }, + "piqa": { + "acc": 0.7486398258977149, + "acc_stderr": 0.010121156016819255, + "acc_norm": 0.750816104461371, + "acc_norm_stderr": 0.01009188277012021 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/8b7178b44b/evaluation/rankeval/8b7178b44b_1_lm-eval_global_step84877_2023-01-31-11-38-06_1shots_backup.json b/8b7178b44b/evaluation/rankeval/8b7178b44b_1_lm-eval_global_step84877_2023-01-31-11-38-06_1shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..22895b1470b1d8a5e1c51035d987d2018e89f9d9 --- /dev/null +++ b/8b7178b44b/evaluation/rankeval/8b7178b44b_1_lm-eval_global_step84877_2023-01-31-11-38-06_1shots_backup.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.313, + "acc_stderr": 0.014671272822977885 + }, + "anli_r2": { + "acc": 0.325, + "acc_stderr": 0.014818724459095527 + }, + "anli_r3": { + "acc": 0.3491666666666667, + "acc_stderr": 0.01376707539507725 + }, + "cb": { + "acc": 0.4107142857142857, + "acc_stderr": 0.0663363415035954, + "f1": 0.2576489533011272 + }, + "copa": { + "acc": 0.79, + "acc_stderr": 0.040936018074033256 + }, + "hellaswag": { + "acc": 0.45200159330810596, + "acc_stderr": 0.004966736811010493, + "acc_norm": 0.5935072694682334, + "acc_norm_stderr": 0.004901747426331751 + }, + "rte": { + "acc": 0.516245487364621, + "acc_stderr": 0.030080573208738064 + }, + "winogrande": { + "acc": 0.5666929755327546, + "acc_stderr": 0.01392691505275734 + }, + "storycloze_2016": { + "acc": 0.6953500801710315, + "acc_stderr": 0.0106434269886468 + }, + "boolq": { + "acc": 0.618348623853211, + "acc_stderr": 0.008496550741178254 + }, + "arc_easy": { + "acc": 0.6346801346801347, + "acc_stderr": 0.009880576614806928, + "acc_norm": 0.6254208754208754, + "acc_norm_stderr": 0.009931758820410629 + }, + "arc_challenge": { + "acc": 0.2764505119453925, + "acc_stderr": 0.013069662474252425, + "acc_norm": 0.2986348122866894, + "acc_norm_stderr": 0.013374078615068752 + }, + "sciq": { + "acc": 0.898, + "acc_stderr": 0.009575368801653892, + "acc_norm": 0.902, + "acc_norm_stderr": 0.009406619184621228 + }, + "piqa": { + "acc": 0.7486398258977149, + "acc_stderr": 0.010121156016819255, + "acc_norm": 0.750816104461371, + "acc_norm_stderr": 0.01009188277012021 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/8b7178b44b/evaluation/rankeval/8b7178b44b_2.json b/8b7178b44b/evaluation/rankeval/8b7178b44b_2.json new file mode 100644 index 0000000000000000000000000000000000000000..566e864bf6972af6202d88bcd90b3e12f4fe43ad --- /dev/null +++ b/8b7178b44b/evaluation/rankeval/8b7178b44b_2.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.317, + "acc_stderr": 0.014721675438880241 + }, + "anli_r2": { + "acc": 0.358, + "acc_stderr": 0.015167928865407559 + }, + "anli_r3": { + "acc": 0.32166666666666666, + "acc_stderr": 0.013490095282989521 + }, + "cb": { + "acc": 0.5178571428571429, + "acc_stderr": 0.06737697508644647, + "f1": 0.3558162267839687 + }, + "copa": { + "acc": 0.77, + "acc_stderr": 0.04229525846816506 + }, + "hellaswag": { + "acc": 0.44911372236606256, + "acc_stderr": 0.0049638729368579396, + "acc_norm": 0.5975901214897431, + "acc_norm_stderr": 0.004893814890208308 + }, + "rte": { + "acc": 0.49458483754512633, + "acc_stderr": 0.030094698123239966 + }, + "winogrande": { + "acc": 0.5651144435674822, + "acc_stderr": 0.013932814110418025 + }, + "storycloze_2016": { + "acc": 0.6996258685195083, + "acc_stderr": 0.010600915927985021 + }, + "boolq": { + "acc": 0.6204892966360857, + "acc_stderr": 0.008487341975756834 + }, + "arc_easy": { + "acc": 0.6418350168350169, + "acc_stderr": 0.009838331651451841, + "acc_norm": 0.6296296296296297, + "acc_norm_stderr": 0.009908978578665753 + }, + "arc_challenge": { + "acc": 0.28498293515358364, + "acc_stderr": 0.013191348179838793, + "acc_norm": 0.3293515358361775, + "acc_norm_stderr": 0.013734057652635474 + }, + "sciq": { + "acc": 0.918, + "acc_stderr": 0.008680515615523727, + "acc_norm": 0.919, + "acc_norm_stderr": 0.00863212103213998 + }, + "piqa": { + "acc": 0.7475516866158868, + "acc_stderr": 0.010135665547362362, + "acc_norm": 0.7453754080522307, + "acc_norm_stderr": 0.010164432237060494 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/8b7178b44b/evaluation/rankeval/8b7178b44b_2_lm-eval_global_step84877_2023-01-31-11-38-06_2shots_backup.json b/8b7178b44b/evaluation/rankeval/8b7178b44b_2_lm-eval_global_step84877_2023-01-31-11-38-06_2shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..566e864bf6972af6202d88bcd90b3e12f4fe43ad --- /dev/null +++ b/8b7178b44b/evaluation/rankeval/8b7178b44b_2_lm-eval_global_step84877_2023-01-31-11-38-06_2shots_backup.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.317, + "acc_stderr": 0.014721675438880241 + }, + "anli_r2": { + "acc": 0.358, + "acc_stderr": 0.015167928865407559 + }, + "anli_r3": { + "acc": 0.32166666666666666, + "acc_stderr": 0.013490095282989521 + }, + "cb": { + "acc": 0.5178571428571429, + "acc_stderr": 0.06737697508644647, + "f1": 0.3558162267839687 + }, + "copa": { + "acc": 0.77, + "acc_stderr": 0.04229525846816506 + }, + "hellaswag": { + "acc": 0.44911372236606256, + "acc_stderr": 0.0049638729368579396, + "acc_norm": 0.5975901214897431, + "acc_norm_stderr": 0.004893814890208308 + }, + "rte": { + "acc": 0.49458483754512633, + "acc_stderr": 0.030094698123239966 + }, + "winogrande": { + "acc": 0.5651144435674822, + "acc_stderr": 0.013932814110418025 + }, + "storycloze_2016": { + "acc": 0.6996258685195083, + "acc_stderr": 0.010600915927985021 + }, + "boolq": { + "acc": 0.6204892966360857, + "acc_stderr": 0.008487341975756834 + }, + "arc_easy": { + "acc": 0.6418350168350169, + "acc_stderr": 0.009838331651451841, + "acc_norm": 0.6296296296296297, + "acc_norm_stderr": 0.009908978578665753 + }, + "arc_challenge": { + "acc": 0.28498293515358364, + "acc_stderr": 0.013191348179838793, + "acc_norm": 0.3293515358361775, + "acc_norm_stderr": 0.013734057652635474 + }, + "sciq": { + "acc": 0.918, + "acc_stderr": 0.008680515615523727, + "acc_norm": 0.919, + "acc_norm_stderr": 0.00863212103213998 + }, + "piqa": { + "acc": 0.7475516866158868, + "acc_stderr": 0.010135665547362362, + "acc_norm": 0.7453754080522307, + "acc_norm_stderr": 0.010164432237060494 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/8b7178b44b/evaluation/rankeval/8b7178b44b_3.json b/8b7178b44b/evaluation/rankeval/8b7178b44b_3.json new file mode 100644 index 0000000000000000000000000000000000000000..523165ebe15060995ff5b8315fbb7bf6c8726018 --- /dev/null +++ b/8b7178b44b/evaluation/rankeval/8b7178b44b_3.json @@ -0,0 +1,73 @@ +{ + "results": { + "anli_r1": { + "acc": 0.313, + "acc_stderr": 0.014671272822977883 + }, + "anli_r2": { + "acc": 0.325, + "acc_stderr": 0.014818724459095529 + }, + "anli_r3": { + "acc": 0.33666666666666667, + "acc_stderr": 0.013647602942406394 + }, + "cb": { + "acc": 0.48214285714285715, + "acc_stderr": 0.0673769750864465, + "f1": 0.3995062282572102 + }, + "copa": { + "acc": 0.74, + "acc_stderr": 0.0440844002276808 + }, + "hellaswag": { + "acc": 0.4510057757418841, + "acc_stderr": 0.004965768348628053, + "acc_norm": 0.5970922127066322, + "acc_norm_stderr": 0.004894801119898596 + }, + "rte": { + "acc": 0.5090252707581228, + "acc_stderr": 0.030091559826331334 + }, + "winogrande": { + "acc": 0.569060773480663, + "acc_stderr": 0.013917796623335966 + }, + "storycloze_2016": { + "acc": 0.7124532335649385, + "acc_stderr": 0.010466744473098368 + }, + "boolq": { + "acc": 0.6204892966360857, + "acc_stderr": 0.008487341975756834 + }, + "arc_easy": { + "acc": 0.6405723905723906, + "acc_stderr": 0.009845958893373764, + "acc_norm": 0.6376262626262627, + "acc_norm_stderr": 0.009863468202583773 + }, + "arc_challenge": { + "acc": 0.2858361774744027, + "acc_stderr": 0.013203196088537369, + "acc_norm": 0.32081911262798635, + "acc_norm_stderr": 0.013640943091946524 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0 + } +} \ No newline at end of file diff --git a/8b7178b44b/evaluation/rankeval/8b7178b44b_3_lm-eval_global_step84877_2023-01-31-11-38-06_3shots_backup.json b/8b7178b44b/evaluation/rankeval/8b7178b44b_3_lm-eval_global_step84877_2023-01-31-11-38-06_3shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..523165ebe15060995ff5b8315fbb7bf6c8726018 --- /dev/null +++ b/8b7178b44b/evaluation/rankeval/8b7178b44b_3_lm-eval_global_step84877_2023-01-31-11-38-06_3shots_backup.json @@ -0,0 +1,73 @@ +{ + "results": { + "anli_r1": { + "acc": 0.313, + "acc_stderr": 0.014671272822977883 + }, + "anli_r2": { + "acc": 0.325, + "acc_stderr": 0.014818724459095529 + }, + "anli_r3": { + "acc": 0.33666666666666667, + "acc_stderr": 0.013647602942406394 + }, + "cb": { + "acc": 0.48214285714285715, + "acc_stderr": 0.0673769750864465, + "f1": 0.3995062282572102 + }, + "copa": { + "acc": 0.74, + "acc_stderr": 0.0440844002276808 + }, + "hellaswag": { + "acc": 0.4510057757418841, + "acc_stderr": 0.004965768348628053, + "acc_norm": 0.5970922127066322, + "acc_norm_stderr": 0.004894801119898596 + }, + "rte": { + "acc": 0.5090252707581228, + "acc_stderr": 0.030091559826331334 + }, + "winogrande": { + "acc": 0.569060773480663, + "acc_stderr": 0.013917796623335966 + }, + "storycloze_2016": { + "acc": 0.7124532335649385, + "acc_stderr": 0.010466744473098368 + }, + "boolq": { + "acc": 0.6204892966360857, + "acc_stderr": 0.008487341975756834 + }, + "arc_easy": { + "acc": 0.6405723905723906, + "acc_stderr": 0.009845958893373764, + "acc_norm": 0.6376262626262627, + "acc_norm_stderr": 0.009863468202583773 + }, + "arc_challenge": { + "acc": 0.2858361774744027, + "acc_stderr": 0.013203196088537369, + "acc_norm": 0.32081911262798635, + "acc_norm_stderr": 0.013640943091946524 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0 + } +} \ No newline at end of file diff --git a/8b7178b44b/evaluation/rankeval/8b7178b44b_4.json b/8b7178b44b/evaluation/rankeval/8b7178b44b_4.json new file mode 100644 index 0000000000000000000000000000000000000000..f9eb6f4001448997675647a5e48561e5dd55009e --- /dev/null +++ b/8b7178b44b/evaluation/rankeval/8b7178b44b_4.json @@ -0,0 +1,54 @@ +{ + "results": { + "anli_r1": { + "acc": 0.311, + "acc_stderr": 0.014645596385722694 + }, + "anli_r2": { + "acc": 0.299, + "acc_stderr": 0.014484778521220477 + }, + "anli_r3": { + "acc": 0.335, + "acc_stderr": 0.013630871843821474 + }, + "cb": { + "acc": 0.5178571428571429, + "acc_stderr": 0.06737697508644647, + "f1": 0.43401043401043404 + }, + "copa": { + "acc": 0.82, + "acc_stderr": 0.038612291966536955 + }, + "hellaswag": { + "acc": 0.45140410276837284, + "acc_stderr": 0.004966158142645416, + "acc_norm": 0.601274646484764, + "acc_norm_stderr": 0.0048863535635718415 + }, + "rte": { + "acc": 0.49097472924187724, + "acc_stderr": 0.030091559826331334 + }, + "winogrande": { + "acc": 0.590370955011839, + "acc_stderr": 0.013821049109655491 + }, + "storycloze_2016": { + "acc": 0.7097808658471406, + "acc_stderr": 0.010495529690730063 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0 + } +} \ No newline at end of file diff --git a/8b7178b44b/evaluation/rankeval/8b7178b44b_4_lm-eval_global_step84877_2023-01-31-11-38-06_4shots_backup.json b/8b7178b44b/evaluation/rankeval/8b7178b44b_4_lm-eval_global_step84877_2023-01-31-11-38-06_4shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..f9eb6f4001448997675647a5e48561e5dd55009e --- /dev/null +++ b/8b7178b44b/evaluation/rankeval/8b7178b44b_4_lm-eval_global_step84877_2023-01-31-11-38-06_4shots_backup.json @@ -0,0 +1,54 @@ +{ + "results": { + "anli_r1": { + "acc": 0.311, + "acc_stderr": 0.014645596385722694 + }, + "anli_r2": { + "acc": 0.299, + "acc_stderr": 0.014484778521220477 + }, + "anli_r3": { + "acc": 0.335, + "acc_stderr": 0.013630871843821474 + }, + "cb": { + "acc": 0.5178571428571429, + "acc_stderr": 0.06737697508644647, + "f1": 0.43401043401043404 + }, + "copa": { + "acc": 0.82, + "acc_stderr": 0.038612291966536955 + }, + "hellaswag": { + "acc": 0.45140410276837284, + "acc_stderr": 0.004966158142645416, + "acc_norm": 0.601274646484764, + "acc_norm_stderr": 0.0048863535635718415 + }, + "rte": { + "acc": 0.49097472924187724, + "acc_stderr": 0.030091559826331334 + }, + "winogrande": { + "acc": 0.590370955011839, + "acc_stderr": 0.013821049109655491 + }, + "storycloze_2016": { + "acc": 0.7097808658471406, + "acc_stderr": 0.010495529690730063 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0 + } +} \ No newline at end of file diff --git a/8b7178b44b/evaluation/rankeval/8b7178b44b_5.json b/8b7178b44b/evaluation/rankeval/8b7178b44b_5.json new file mode 100644 index 0000000000000000000000000000000000000000..695dc1109ee2126324544599d9325ab42b53cbeb --- /dev/null +++ b/8b7178b44b/evaluation/rankeval/8b7178b44b_5.json @@ -0,0 +1,49 @@ +{ + "results": { + "anli_r1": { + "acc": 0.323, + "acc_stderr": 0.01479492784334864 + }, + "anli_r2": { + "acc": 0.302, + "acc_stderr": 0.014526080235459548 + }, + "anli_r3": { + "acc": 0.3375, + "acc_stderr": 0.013655897185463648 + }, + "cb": { + "acc": 0.48214285714285715, + "acc_stderr": 0.0673769750864465, + "f1": 0.3081617086193746 + }, + "copa": { + "acc": 0.73, + "acc_stderr": 0.044619604333847394 + }, + "hellaswag": { + "acc": 0.45269866560446126, + "acc_stderr": 0.004967402792744857, + "acc_norm": 0.601274646484764, + "acc_norm_stderr": 0.004886353563571844 + }, + "rte": { + "acc": 0.5126353790613718, + "acc_stderr": 0.030086851767188564 + }, + "winogrande": { + "acc": 0.569060773480663, + "acc_stderr": 0.01391779662333596 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0 + } +} \ No newline at end of file diff --git a/8b7178b44b/evaluation/rankeval/8b7178b44b_5_lm-eval_global_step84877_2023-01-31-11-38-06_5shots_backup.json b/8b7178b44b/evaluation/rankeval/8b7178b44b_5_lm-eval_global_step84877_2023-01-31-11-38-06_5shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..695dc1109ee2126324544599d9325ab42b53cbeb --- /dev/null +++ b/8b7178b44b/evaluation/rankeval/8b7178b44b_5_lm-eval_global_step84877_2023-01-31-11-38-06_5shots_backup.json @@ -0,0 +1,49 @@ +{ + "results": { + "anli_r1": { + "acc": 0.323, + "acc_stderr": 0.01479492784334864 + }, + "anli_r2": { + "acc": 0.302, + "acc_stderr": 0.014526080235459548 + }, + "anli_r3": { + "acc": 0.3375, + "acc_stderr": 0.013655897185463648 + }, + "cb": { + "acc": 0.48214285714285715, + "acc_stderr": 0.0673769750864465, + "f1": 0.3081617086193746 + }, + "copa": { + "acc": 0.73, + "acc_stderr": 0.044619604333847394 + }, + "hellaswag": { + "acc": 0.45269866560446126, + "acc_stderr": 0.004967402792744857, + "acc_norm": 0.601274646484764, + "acc_norm_stderr": 0.004886353563571844 + }, + "rte": { + "acc": 0.5126353790613718, + "acc_stderr": 0.030086851767188564 + }, + "winogrande": { + "acc": 0.569060773480663, + "acc_stderr": 0.01391779662333596 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0 + } +} \ No newline at end of file diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..26f3015deabb23cec0e47a3c7a5164d827fe86aa --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9be540ee4c29022c913c913379438dafaf3e9335ab9c112093a27ec55512e0ed +size 208731415 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0252910cdebc2541d1d856183f380eca59c34333 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a097a3938a224125281435074363be898d321d9233088bd3966a4ab74ac69549 +size 208731415 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_0_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_0_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4c5714323819103e670dd7512e880ead02d1bdad --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_0_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:697adce478f66b6ea60b5602f193c3682bf692fbc97ab1f3b6acf8aa398730ed +size 208732183 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_0_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_0_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9d059f4eba27157eba91931a69b957867c364d1a --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_0_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d31645e636732755fa2e9f513af812d31f3d8f5aea688961037dd417d646218 +size 208732183 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3820d08a461906ee8ca7d58de818be16fc7966ec --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22c799ea35f76bd2d0402cd037f9b7c8bb52ecc20129319271edd16efcffb4af +size 208731437 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7f185c9c63ef805f52bc7774994228cf46c8dbd6 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7419b83354a83981d680b03d083345ccb1b731cb892e682398bd60695a068c8d +size 208731437 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_100_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_100_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0a31f10cf70bd1188f6df68a71feecb3d2bc79f4 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_100_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:55da256ad91c5e802a5f302015ce36fc706f8317473f4d3effb87f87380929b6 +size 208732269 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_100_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_100_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..abf5eefda2294ddb5d879a62a7596827688007e1 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_100_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d311c7dc1df18a321fde42d08a619a7afb6f3684102ec2a6bc09497374c470f6 +size 208732269 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dfb013141b3d89109d64cb0268fd5c9111f199f1 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7357f87951e9aa149925f2051441b2771448a10c7cec7d8b049a867b643f0043 +size 208731437 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ec314ab33fe6c4e50a19b3d78e49dbfdf7cedb44 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f480cb7282c0d97ba5fefef7046d46687b37dd1e82f513845d8ac54c3c38b339 +size 208731437 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_101_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_101_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..11fbc6cf7cecf6f5438961794693676347c2361e --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_101_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b230a264bdafaa006b6fcf61efd8bfc5b8b45cfe9bee9087897436db0a922e51 +size 208732077 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_101_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_101_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e83167fd6b85f366e5bb45578a352b1d65d14cf5 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_101_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a645da5ec8eefd8d316155719e07ff23e7664106cf657a75244409f6e808f52 +size 208732077 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b906d26daace0238b8f39bd9d92e8aceaf1af0b5 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b4b66bbe9055d7aa58931eb533205a2a87712a06e911791151533748d1e1629b +size 208731437 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..89e7341a76457438e71469dca437697209aefda6 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:11add67a347527d3c9dc477b7ebf9bb4785208a7a66d00a68fefaa9d64676fc2 +size 208731437 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_102_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_102_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0788215dd9c9d6ef2f8e2618372d32bc8da22395 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_102_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:55f4fb1353dc2fa0e0e7167ad4c72f6066b3c0aadc58b55d55529925d7283b26 +size 208732205 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_102_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_102_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..90d12c333bb41c66c50c8de604464ec36f43432a --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_102_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be98e3ae42d4c2911a35ea164023163b40f8f1dbd8fe98c9220eafce1c66016d +size 208732205 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c26f044879594e3c29e53327d07f63ca9bbd671a --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c30be40d78e98b7f787be15ca8283239ec67a25880a86d74ed43f391310d74a +size 208731373 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..693e02fcd88743cec6510983aa5f2af900b2acde --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1dc8dbd9b5ab4ba8299c180728e45f8d6dbac473639111ef04658e980d366dc5 +size 208731373 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_103_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_103_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c8616209e6e58559fae8f6ffdae34821764a15e9 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_103_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c9dfffba79bfcc727f69db00ffc1d53ff2b5d08424f7e6c399e380f15fc3cf61 +size 208732205 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_103_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_103_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f38347d7ea6a0645338c4119ac175fc51437e947 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_103_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39469915ae3376923691c43791833ce074e6534ee7ba73788f44413b6efb8196 +size 208732205 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..feba7e69ccdd10699c8a5e67b4348c0c88230fee --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6544d7e17be55623615920bedc71826b1200338f627e327d4e2e43f2b89b7806 +size 208731501 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fdfc8ace186d524803295843fa460cb251594718 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:12d87fd7d4d5058a73161b1b075fc816ceb01bc0317c18f1b57e7c41bb874931 +size 208731501 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_104_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_104_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..77c7d0c916c1e37c9b83eb8c2fa02b300da4af7d --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_104_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b1ba25c7bcacc5230685ffac074b8746b01502067771b6ad6332240f5494e65 +size 208732205 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_104_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_104_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..71743fe0eb6b4eb6432aa3a8938437dfeb670d83 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_104_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:12b69a791cf7d37b26bd89ec4b36411eb80f961195d4c11c6e3698d412d8fd85 +size 208732205 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cd176a38fd1ca8b209471206837f0a3989129e63 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7da77df73b274030b018d7fc64bc498f6ff2b3036b4bbddb990fe44c8b67aeee +size 208731437 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f46cadea70d1a3f2c49418875f39b3932382cd9f --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1734e1f91ddc3ddbf412df7a556583ec5cfebb9d7bdeffc97b5deb83399cee59 +size 208731437 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_105_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_105_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ddb8842f083bf545cb473e0099b35a3efe613f15 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_105_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd025f63937606d4e4115975bfe72904e20bb1d6306f67a6cb90971b0ce593ac +size 208732205 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_105_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_105_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d5d551ae8e9aec862f84e460ad157a3e0c8af4e1 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_105_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f829faacc4965e12eff609647ba5ade45104cf84a2c05ad68977adde19d6133e +size 208732205 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4deb88b9c808374747afef303d02458fc2394338 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd3c476d10242972f690648558cd847997995cc96e6b0df12ca7d026f9b65878 +size 208731437 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..777987d1807a3279d7caa0b2307df39a9751714e --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:652e28c354635da5e66cc37e69701e0f67e6a6410b0fb29445b4314c5bb516d5 +size 208731437 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_106_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_106_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c7fabaaa902d3aa4f8c30892e94acb94400ebe03 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_106_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06d6c2a185344166df38715253b74d3f9fffa45fc6685359f19b83dd313c47aa +size 208732269 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_106_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_106_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..91606a2bc8336ae32c62b023640e9f5e53d2f632 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_106_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3280f1250c5581e296ca918c14371148217d0ebf36e4e19625b0c7944049c0f +size 208732269 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..aaf6db3194b8a5418ba498797933c0e4489efc7b --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:367ea7fc434f1b4b9f5cee37fd5f39d0a93187cd668e40393629457a08fa5745 +size 208731501 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..236b63950de05b22796b7dc70058fe9e100adf77 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4fcc17015a50518210447f2c3d1176de4838b8975e2ec4a71ac92b0e485fbb5d +size 208731501 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_107_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_107_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bf232fdfec214f08dc94a9d26cb8bda695538af1 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_107_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c2cf9dc0dbfe963f594f9444724d22b3a9b9bcdf1ad262b1ca1d6977b35a190 +size 208732205 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_107_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_107_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..27f9a3c3ff138ecbec3b848699f68df1e6bf2d35 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_107_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:347a469ee68cbe333a498488b1f765adfa3e62d283b43fa672780893217e1a71 +size 208732205 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1fa7d231a33e168e4bca886206eaa316ecf1769d --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be6576a62fbf43a0bc107d39ac5eaff0d0148991f5ce37b4dcfc56665c32a76b +size 208731373 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2bb1d02c17c0f9a4ecefa9d747c48800dce3501d --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b6786768b207fdf75400b11b65e3da8c64819526593b55d82d8c24752ac41d6 +size 208731373 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_108_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_108_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bd73e5e5e256c9b4c77af70302a2a0bc545fa974 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_108_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:63d6001f55061839822db3656d155aaa2e40d111133138b7a404cfd334002dcf +size 208732141 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_108_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_108_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..42e739d57f1694d543786aee2add58d56866f91c --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_108_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fcdfb0e94461e31a53b6f6c749874a782148683609015ed950c686bd610eaccf +size 208732141 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..57b86f81153b4266f1db46990035948d7b38dec5 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee1ed46d56fae493fff1aea05efa1dc928b99f993cdc42751b0f6ddf55dc75fa +size 208731373 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..af5baf403c54e5c2108b5b2f0fdd5bc133422979 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:daf2c9df57b16d6936fe6be9f57c6c155601e5569b45884874252bc4ffaecb90 +size 208731373 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_109_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_109_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..12eacc4741ce6abbb6f3b94440ccb2d42c4251f1 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_109_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d1f58e4fcea8a57c14053074e663731319a7ca8a5c6d44e969a8a5644110b9f9 +size 208732141 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_109_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_109_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6eb2f2281db91b5343d2bb43adb9d12987fe7c50 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_109_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bbd8bed738b04676820e42da2030386407fb86c941c878b1a105d0f66e9065e9 +size 208732141 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2cca022e8ac3162e6ad5d2c1a580930cbd90ac5e --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f369c71aa8524155b9c6948730db17798216e112b3c9c2fd2b373ca25b31c65 +size 208731362 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..05126b3fd4e6149a81c38f4d5c3e79c9e298a09d --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:637fe52a3653cf0c7d3209a7499e11b5503d8bf05308b5caa21075afda99bcc6 +size 208731362 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_10_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_10_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c087069cd6741d2489627946b1d6f96ea6ec4fec --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_10_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b6512c983d12efa0379e25f6998470d052a490d7c1ed0d27a4e0450676055e7 +size 208732130 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_10_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_10_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..836c8f534ea7e06db1140e540ffaae2bb1c85e77 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_10_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe6ca76fdf14050e079a4532747c4895ce7e3235d60a19ae5a48ebc3397e41c8 +size 208732130 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bc2caa72e330f89e1fe99337d84dcae80fc7d7c4 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5fa8767475bc9bb83686c07996e65eff6778f20c1f000b0fa631ede8f71815fe +size 208731437 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8c6686e1d43b0c653d013de64bf21f7cf5bfa526 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ac9e3722372c7ec87d1fee7cba56207cf1ec93164934aa4f63c2eb034effe2a +size 208731437 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_110_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_110_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..81016d61d4d80cd410af5c8589efe59a5449fbb7 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_110_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b1464ca2c89db59f00a2a6c00d9e1345a119879f8b47147e8fc3c680c7127331 +size 208732205 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_110_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_110_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4a412d60e0fb89ab970a76ba8662a89e6ec17f0a --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_110_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9de8ae8dad4d776bc9bc658e574e2daa2fb527a291bbd517f48d407acbcae7b +size 208732205 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..63f7ae0c16a7953dc65434d0151bedd94084095a --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c508c5456dd02a82d0cf74f56d9a50774c01eff888d6535697a4864f9ad6abc3 +size 208731373 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9045cb9600fcaf107dc9c5505e6c3cdd84bab810 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0b2b1e3ea45c786940cffdec7c99fabcb9ddb61a6f301a8dbd962687f1fca94 +size 208731373 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_111_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_111_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..55e874925cebf2180a1886e75ad76d548caf002a --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_111_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90158f3ada9e6fdaf174d41142e27f6c16dd0f2c740bd88a937d442aff0a35d2 +size 208732141 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_111_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_111_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e88032a9b46d5c423cf5c865a360af781cfd5050 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_111_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c93b0624a384810b9d7d84b18c802019028da1db44765051dc9d65b856599249 +size 208732141 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1f04c3933dffb3f88a7c1641b06e12a847c983f4 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:21ad464b8bac96531ff0f9cb698fbc0f6c532937cf2e596af5a53025aa7183ff +size 208731437 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a3829fac767cd72cbe58924d508539fcba739706 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0337835bf7f9552f9dce8018285351d79ab2bd2433349baaa845f1a83bdb49af +size 208731437 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_112_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_112_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a47699652a1e6b6d655eb2cbffbc35d2f8b52921 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_112_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d969a38b1b1db1b72270a338f429aafde37a2b48acd680b6e6bdd1a50a647a2e +size 208732269 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_112_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_112_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..142cbf4601d7f40fd8b8aa03bdab87855b945b30 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_112_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8765472e4fe3ad378ac0c9a6333b03a081e125fe867f518050e7efa03536044b +size 208732269 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..aaa0efb6c3bce3a1317f15a24b87a640dc49d226 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:810e8da849228a3221bb7ac387defd54fcf0cd1c2fe9d44b5738cd862ae3026f +size 208731501 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c0ac1c9a1a4d32cbaf8acb31ca3db1a2431a2cb5 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db81d2844294e09350c74b54320ebf717850481b9c15099ab5578184b31efe21 +size 208731501 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_113_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_113_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2f4f047d414ff3462ee4ee25865b6109ad74f77f --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_113_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa21ea99f690d5bc1ab5349465c17103ded35d577efa2b37559b74379472a7ee +size 208732141 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_113_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_113_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d245f9f2c41e9c968fb2f23b001a13a0ee2e44e2 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_113_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b13b578839db752271a0bd847015ccbf8042298cbcbb642fc4590d5cdabae85 +size 208732141 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c452aa9a7ecc73c6be7491080ccca32262cd4f23 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2011ff743993cf590f48896ca72cd7ce7eaabdb77a5c916959ba5beae99ac474 +size 208731309 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..82217061f6d5d51e9bb5a21e5b2c941efcfff216 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7893f523b007312e88f25a0c4d496d41cae397dac2e9ed9cbc74d8a39896bb44 +size 208731309 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_114_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_114_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8691675390cf49e9636955123c825e0813cd2f25 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_114_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7fac91bb00a7be9cfc4b3cefc91a924691a19db6ef4c85bee1af70895b37352 +size 208732141 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_114_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_114_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a5826cbf268d9731158e276f5a0be24f5d78f20d --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_114_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4913ef8565cce9722bb2b720cdc38bd8dbe0d9e443ad1b4f756d1da0669e9542 +size 208732141 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5685bc5d8bf9fc83017dcf0ddc5bdf0ef660ba47 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5bc53ae31352bac510e0a560bd19e479ecd9305ae496afb723ae76e49252a60 +size 208731437 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..731e009fda026b2f8b260c9a2f1a8f371ab17a94 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:88c0479d51573186c240d9c85b2099f6a3752bca6489f338d23a609b3b7cfcf1 +size 208731437 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_115_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_115_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bca20ed211580f2c65134e692cbbb8bee88051e0 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_115_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:baec05a20f1d72e1d9cef59d4a4986cb29d4d0add14c474812bc7d58a64ccd0f +size 208732205 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_115_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_115_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d6ead654b1a7beb01712f6cbcf58302da944afc6 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_115_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:29191311eed4704139fa7217387ecbc54e13e5e812a040d0e9251a790104a136 +size 208732205 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9cab13be2f5fa3c46765db2ad4630c5f356187a9 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a48a1622bfdd65f3642ba0fa13f12c12a721c70b9d9d0d2753ae8758b0f77065 +size 208731501 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..da3338d5f9c2ae3230f960ad6b0c0760a5f853a2 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8673dd3abe132672baecbad7c673fe3dbe0b39fa7512d2f1ee701134979f5693 +size 208731501 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_116_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_116_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fbf43aa2148d47a02e362d6389b81ddc2f643eb6 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_116_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6a96de50187619d66ee6492e51c633c743747dc23288e2df688a37d188f4d8a9 +size 208732269 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_116_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_116_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fedc4f594a8768c07e12942cf3f3bfce0b24d86c --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_116_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b54202db51576b46e49951859e108ea365b30ca1a8009e14b434deebe2a49ee1 +size 208732269 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2cfd18ecfccbe663499d38dee2ff63e36189de30 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64b07cec3f62bfde8d21c10008d88b6007545f674ab78b986c757d7a8ae7530a +size 208731437 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e8c12e73a2135b7c7aca07cbdd3534c3d33ccc82 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b33b2d518990b84c4bce9f98571dfe1b7304b2adf79170133fbf689c53449a61 +size 208731437 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_117_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_117_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..24740a014c3bc4ad71c98fb15fa220c3b719e2b2 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_117_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f531b2d0e61e48c581b3d62b6b1dc32d1c598fbc212a6dc8602f09eb66a50074 +size 208732205 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_117_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_117_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e02874c2c1033573cd4f2a679d9fc193cdf4686 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_117_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:93f5acf524780a778f78550592c03c5fbdbac8971a003a4f02da64ddbc9f8b44 +size 208732205 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f9793a6c8d71c6d466c655d14b3d3ef7cf45d627 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74aa56e54214622dceafb5aecf5f0e0fd680688d93b3081aa7524b58f7fe0d9e +size 208731437 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2ad1780442550db83be7a83210104a01f12d394a --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:62914d790b9c66dd1d59124f82c6c1933002f05bdf4c0d961408add77d2cec11 +size 208731437 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_118_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_118_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1a0328fb83e539d24f60eae8efde260d269f0430 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_118_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8427bd33224445c066bc535eb13c5f533654d50d5e51489add19350bae7ed27 +size 208732205 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_118_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_118_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6d622ca6799e2c6434e254b50ee46036fd6278b2 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_118_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9da898ae98a91c1ec81b4e2d97ff6f2b9bc20eefb1c78c22ee721cd171434c82 +size 208732205 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..353720dca7b87cdf1f130f440738a5f308e38cb7 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc4c80d20c9a3c346f2f3bdf19fa698bd65a7eddf72099a5ba36cc90f6952908 +size 208731501 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..06b9ad703d51588a95c33f417df633424b689449 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:81484b20510298bebdfea40c25840c067be076bb618aaacf3c12f4313478d798 +size 208731501 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_119_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_119_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..46c5defc1aba31697f6be8224abe3ac96f8dd7eb --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_119_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aba319d6bb8ecaaf0deb64a531bcd5ab9222068ee1bf3fcec4927ceab89767f4 +size 208732141 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_119_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_119_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a7bfd69ab43285e0af14eb92e1d0d4288787ba7c --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_119_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea19b76e303bb2fc43a3956136fb1685a7c0554792f5b8bf5c712bd97c374748 +size 208732141 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6091b6beaabab8337c0b612afc12f93b742ca696 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:71031eb80824b26a5031abf41db79cb3171552e8cd63ee684a52049133263735 +size 208731490 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6da1d7d22c282c8fefc541c9a57bfd93ca6856c9 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a61f8b226b2b29c5149e359b8db4b6a82736eabfbc2ec9fbc6ba58ea4e5e219 +size 208731490 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_11_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_11_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8fac15b08dc8da9a3b7988db9eba9786d16068da --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_11_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:38a8cce905a4ab57cfc79c9781386ded839f293b5eabe309a79aa7de9457f243 +size 208732258 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_11_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_11_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..571308487a35e182b5daf1af2b9510cf72a68210 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_11_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:40bccb70cc63709dfcc10f38c8fd2387d72f8c465541ff6488c1f19df46ccd50 +size 208732258 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b09589f3961242c7d2813e0b9fdb73d0c01aa78a --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d54739ac657cd08bc4feadddcab0a5ed8b953f2bce88c1b4adcaf6d21ef88823 +size 208731373 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d965ce451863b1f274635473947ff88af46795a9 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb5e9ffcfc658b342b974b620598b4a5bfd59600ae7063a1e493ef690298c549 +size 208731373 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_120_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_120_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5cb55b220404ae11aad97fc8c19b519fce03fbf3 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_120_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f216e073b27e5361ab6ce859c19e315a7a42a9e25253a46b07a43d71f14e6e71 +size 208732205 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_120_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_120_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ed1adf06358070066626d2875e3d7bf01efc0de9 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_120_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:57ef1d3d0a07c576e2aafeaccb2d62585672f027b12c6508d1c102ba1b219108 +size 208732205 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..31ee9973ad61a26e7f90f179951ad09a5e2c7304 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a1b5f69b9cfec82b453c5ab4be38451185a59bf3f38c0024f34fd2bf0aa066b +size 208731437 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c9825cdc827391abab2f114ef8b424ab12216c94 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e1669380d3b48cd528e2d347b1e8edf036a10699e5bd40d3e6588d37e9c82f15 +size 208731437 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_121_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_121_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0c388ae31534af59b0e92d25d5d7e996dbf8428a --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_121_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e6aa74a1396bbce8b9bc4627953af0b2f76425e7e25feb113cf3314d90c8fb8 +size 208732205 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_121_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_121_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..856356850839ca6ada13be189a5cbcc94555794f --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_121_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:09cc5221f1aceb309a507ec0e9b117a99d4247f92de883ef2884bec9ca5ae529 +size 208732205 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cb164f888818338eaaabf731aba87c98bd5b533e --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e78d474819883c900f7fff85cbe54eab706cb8c929c522e0964432155a622347 +size 208731309 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c35599d167101a133ce65a8a8d3bdea826af49fe --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f60340b87d0fc9d484549ba3a028d3a5ac9d8dd01e002131ec4322b1df97557a +size 208731309 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_122_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_122_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..25ce79944fe56adc0a12ecab4aef416d77e195de --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_122_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef0f28fce5bac96399acf634dcf5cb70d864dc9634c7e1814fcceb8d09bedc34 +size 208732141 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_122_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_122_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..29243b92017fe33b91fd27411fc9d1dbd02703b4 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_122_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf59d8e677e8d949e597a4eaff0cceaef56a0c6b7b21039fe00bb56f3c259f28 +size 208732141 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..85542999736ff8ce60287fff3b785d4f6b10859d --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:41fe08250903a51185af69b6154aeb3c83b148f4b615818d16bbda1521727d0b +size 208731373 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..888fa33f8c355e57b3b1e9390ecd482d15515a1a --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d559ae6510639c071e6674acae05b09c7138397ebdf62f2e990644f701118223 +size 208731373 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_123_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_123_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b9fad3b9b047362878b7682d79ee19307a70eec9 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_123_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c4d86f6b2f312947718f52f9e4f9df14c80b3456958bca681f41851d244b620 +size 208732141 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_123_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_123_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1666fb404e1f2648874bd4b0fb575c933257b0f0 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_123_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74b413fabefd49dff8d708a4170d60ac867a438fa6ed24d656963b7d16f872a3 +size 208732141 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0ea10ee0936fdc6c12d3628c4908c19bc94f0648 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a3314f2101d7c594eaaebedc254664887d4b3526180c24db3a22b656bb837a1c +size 208731501 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..456099f60e48ae8522145b55713b6a3751547330 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:849cfc752a04264a2ba17748b699a2eabe05f033774e1845ecdfccdf085fa84d +size 208731501 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_124_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_124_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..91ada37fcefd0f9fd62149b46e57bdd16619c51f --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_124_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c9857aae1049e2e5ec303cc47725a806e9ec11f96105277e04bbd3cd5076970 +size 208732269 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_124_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_124_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3ab6d245d055ceec19681142551e9c7430128c7a --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_124_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22867a11fc9d3693e0bf6a34bf95cca2c658b8493f5db27f3fdca3e6de86d199 +size 208732269 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3db75f17cbce3a932cb65aaf2e4cd8d5ef5a1f33 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1714a2b693a885de205052eacca6ce570769318a4d801207ad6d29de12d0a1fc +size 208731437 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..121d9eacafc3c9a1dec546a36aaf5c2d6c7575c9 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a5676b0b30a05ac2b2c2e41e6e3cda28b1df841168587fa5d2fbe1742efd4e4 +size 208731437 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_125_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_125_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..54346dcbc780345edc04a907f1086437350572e5 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_125_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb17f950859b71a6762c9d109772abbc5a9fd6b454d65bffd217d4b18ff6d91e +size 208732141 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_125_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_125_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..86d61a1533e342de447d68131aa76498d421079e --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_125_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f8b3ef8e060fb1cf9b458f1d1544844a67873c107d194661abdbfa6bcac2a7be +size 208732141 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4617a2d1307e1ec67cae0e4f8142affd37b9b0d9 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ad048fa40b6dd44559902c03a61634eb82eb755fa6234eb83b4e86fd8615d53 +size 208731373 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9dad56196a59e002cf2b645f3ad75417b349fabe --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:baeda2109a2dd230404cee7782c47e7f9f842e5e48c680c992cf26e9b5d87f3e +size 208731373 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_126_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_126_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e2c14fa6561985ae60c49cbd79baff9ff31e5f6b --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_126_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca4d4be84a1f9cc4fdab00270618a69125ca77a76de6857f43066de6b2a330a5 +size 208732141 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_126_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_126_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8b00f41c1afbf5123d7df6689bb904169d6cd974 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_126_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:17cbe71a8675f10eaebe9bb6b982e8399834435b47edd98dbfc7ba22a7da8998 +size 208732141 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5c790eb9c16e4bf2825b6cfec0a4f648644d32c9 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:736894607f9fe7462e1bc5bccaebf6d90be31c59360f1140f19e6070f34ff9a8 +size 208731373 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8fddc2cb005645e18a534bff7783f99680784c35 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3854a8272fa6d6d31f695a193d49aa3d9efcfe15f2066aed995daa4ac46a9ae2 +size 208731373 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_127_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_127_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..baef0267e27fad797ce1f9f90baf79b2da36313b --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_127_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d997ef241af6a02db1bc9bd3a205ec4bbdecfbfc9a5fd103c5b6d6710aff107 +size 208732077 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_127_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_127_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1d78ef1130bc194d60ab9f54d7bde5a4136671b8 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_127_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:26454d5053bfd9f56bde791add1365ec4587f25844dafc73c3db6e9b76f28130 +size 208732077 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6f5128766c2e0e6ba6d9200a2c54f2f0d0d189bf --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:04d4319616ca07675dd305c48143f076f639e69697a617129941b81fff97cb8f +size 208731554 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..79df5ecc9f36712fd883a730bd0e536e00725884 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba02f7777212420a40ce655edd7dc78cbaa475453ed90dc2cb3c2bc6ee82290d +size 208731554 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_12_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_12_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f7cf3d2542da8f5913e55ecc09265441e3f7e376 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_12_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:89f6df4728a6a459f3a4b8f44abd87197086580c96d5a756364c55eba8789e8f +size 208732322 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_12_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_12_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ab326ee3f8b5404247f177eeda6fd8bef3ae5e96 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_12_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c9974dabe03bbeab02a1e20968fef13b71e42514ca15133801a279d12fdde82 +size 208732322 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7b739391b96c7be252d2e98c6174e6b8006f82b5 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:110fa5099b1a716ebc0dc23dc217b4ca510f1d9746c78dbb1a77c8887ea31634 +size 208731362 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5e09600985c93c14ce82a56b493f4e62a71fd93b --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:269dd89133a3d252e10d5295bb8e657ef3c5283382b62120d8a690a39c92a86e +size 208731362 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_13_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_13_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bd974689fa5b6631a395f3ff76db45d0170fe472 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_13_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed55041861cde74fa8b8fea7e42d3681d2476ecaac60260aabd2c7252ef4cfa6 +size 208732130 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_13_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_13_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7cefe5f5579380fb0d2bdae805ac24f020bfb063 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_13_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6bfd28b413c3140857c487ba54f601a121bd15291f94ba50cae44b3b57873b63 +size 208732130 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..416b02da777b5b7918a98f9ae41210c9d9b06d4d --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:49c8aa28747ff75591d7a7be06feb9a32c218b48a5174e0c1b27c25ba20a4c5a +size 208731362 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..204a7a95c01776dd5c11eaae8a401bcbc756ed5f --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb38b9d5f60e5db3296ccd26191d7e218a354c2c067385536d3407c756e0c78d +size 208731362 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_14_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_14_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..880bf01cb8d22e7f468a9e465fde636883eca41f --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_14_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a94fb61c531f7dc28da530f2952e76d00c3be72e1d623992101202d8fdc6dffa +size 208732194 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_14_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_14_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..75f5b6f5f2c8c1242a03f1e5aaf837881fd56547 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_14_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:75e878497c8c79b9c5675c295c9d04b61e46af87d728705bad1c43af58e016a7 +size 208732194 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2cbc2b3282e0a189314ff99416663df1246419a2 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64905d794fd1a81e0f7ecde2380e7ebf7e795ec81efe59efb12f6b19d401ff1b +size 208731490 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d9140b505a53e7e73a6171b63e8036f981670b22 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:380a1571d1c984a3cb100335e5d702021249311e180835427a94a3b9f05c3de1 +size 208731490 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_15_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_15_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8f136589ddb009f87332c0c9710646a09bdaa257 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_15_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f1ce06ca3d9d649a4ed780610ff2a7719a28cfe4923f33762ab3a8cec9623ea2 +size 208732194 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_15_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_15_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..aa15d54080a0ac8616cf2bec1d8abc91f2f22aa9 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_15_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d4d2791a5b8c70c5d0eb1311b87bed8acafe80deebe3b9bd7360d9359dda7be +size 208732194 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5775073834683ebcd896bc4dfcf9883260d1e21d --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f625175ee681c4afdd51a0243e6c01ad4bd4034ac94d9d89bb6d14dc3f733dc8 +size 208731426 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5b26b103f7fa26706f519e9a1f47d1fd2b8598af --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7a295ca6a29cb68f129833369cc89aee950ca7c26ea938769422816ebf3463a +size 208731426 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_16_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_16_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..48e5762155242ed094bc8f5a2df27852ccdc7f95 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_16_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f5f787d05f7fc5166128df6547b4dd2b4edbc6f25f5c0a43bcc4212248f93234 +size 208732258 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_16_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_16_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d55939c35c5789995c09640fbc347453834a1a78 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_16_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64ac0e7435010d5902fe37d9f321f2eedb8af972fc87502d16b60bc5b4204791 +size 208732258 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..365164fe733c67503a632436725b59bc6c504271 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f8ff2d96efb0352ccfb2d62c97d9a18ff68025b1cf314f3af6d12f0ee0bd2ff3 +size 208731298 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7bbb93649ca73fccdf1579e27925190aa0645a2e --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab5d8307bd38d61cc48a72fdabc99dba4839eebdcd5f665a9ca705da30abd68c +size 208731298 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_17_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_17_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fb1ce0091647dc0de0ba9af6e73d6d0354db4549 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_17_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f8aa8c2a3ce0df52009c4884bc5c6e8d673dfd50247320498d00bab8613c16da +size 208732066 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_17_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_17_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6a0929098b21ef5fabe8c01414351e7a636abd52 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_17_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba8de9be0f4d8e3a9a89062964ccedae272358fc99f4ba7b7072eb930711dedb +size 208732066 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6aad28d569ce6006d306e465f74c000a90330b83 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c6fbc703c16c49ca4cc0d1a6a047f4599c449ed7379cbc1662df23e984debb9 +size 208731362 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..56a27982b648b231df4853ca7ccda53d00dab850 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8f7804b44c05748a71b6903969e642e1ad91db6d64cd3a03ebdc0a5c6d3fe9c +size 208731362 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_18_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_18_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5e360e9ca08773952f0bb5af91ef3ecbd7d12594 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_18_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e56bbbb1ff4f6bed2c321cd55f23b03418bb6dbc2b685881318b6cead256ddd4 +size 208732130 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_18_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_18_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a1d1cd6e3e50e5492bf1f72e7502538f988612a4 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_18_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:15cfb2a68ded6f435f1baa7ffbb6f2735e0f150d25337f3f464286ad4a3b827f +size 208732130 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ed19000a50c63a474d6594862cbac0344d2c6cb6 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:882f7f5ca9ad0303ae87b06e4d358c4c9c056573a2aa713365ba2e98cc125053 +size 208731362 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..107aba4bb22156d265fc71aa449eab750ba4cc08 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aed3f46b104c85ce2c75f77cade9f56aacf066399f69bf61bb2d84a1bb5ffa6e +size 208731362 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_19_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_19_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5b08b90ab52689e7de49fd78ff76bf038d75fba4 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_19_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d124f9a5d5c190d700e2922d37e85e0d7bfb23ee1688cadb95a743a55507e179 +size 208732130 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_19_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_19_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..19433a042527fbc74e516a6b39593e0d293c9be7 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_19_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:025258ee221ab4ac9ef7a3f0bc0322f3ba6c95bf18be5c957c11fa093ccb3710 +size 208732130 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e2fcdb0b0bcb0245093a33ce888f6c0340abf882 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:999db372dc58e09c95435ff75ee649e99c514a4ff95cc3d704c741424ac606d1 +size 208731351 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0a9939c3b014d7575f84cea2f1f0367899ff321b --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd1c4af5817047621934d527d245473c0534e29abbd7ad77e4b6e5b33a5f82a1 +size 208731351 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_1_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_1_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..da0febf1c55befe3849f238ed655c4650eb0686b --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_1_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:291dbbed0f8b8f19eedfb4821415c183be11d398325b76f8fb5bd593c0719b58 +size 208732119 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_1_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_1_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0198de2da483374a6b36dd95232b84e7e7a4686e --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_1_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e8d434a7dfab63e13bd11e0ec4751f7975fac1b1a36860e1e1061d3a03e7d17 +size 208732119 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dc356251dabae03f4aca276d246ebd806304423e --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d54ef2a8f625be32365115afade2a79057f693c35b1e032a375d170d863d9aa +size 208731490 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e81639eeb1d490be91bc87503e99bca46bc8d70 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0241e4e8b63aa005519d450ab981f381a53a81fd420df9428c52a65ef85d3567 +size 208731490 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_20_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_20_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6c464d93a1741b7529e6556ebff0b57bd980d009 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_20_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b33a9a157b99708c065fcb19afd194303d99f479e3cbd782c4ab97b27edfee3 +size 208732322 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_20_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_20_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a1f152dfaf2450c951bdf5822613cae775b4454e --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_20_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7cc95c7737b866c7eb3afb01fa635dab3086912e9b71cfaad40ea47f0747c71a +size 208732322 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..67ffab30aaa133f221abaa5a2efe331a033bc4e8 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3de477dfcd3e9b134b13a62bc122e6cd1cf5226423e0b3a1795577e40c917d5b +size 208731426 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..73a42e6df90be75d4616712c971ac407a4436206 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8af8bb0e65fd8b5e290f662ad10602eb8e01984d3f3e9f864a021a1f8cf1351e +size 208731426 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_21_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_21_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c704b153adb44862c8ab98ca40a7633ec82475e5 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_21_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7468c0ddc4b70950b4d20c1a166e4b31da4c25864ee5f0caf77a3e2d6c18e4e1 +size 208732130 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_21_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_21_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ba9aa97a14f8aea56158a5cccd226980e8eed1a0 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_21_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:730b62721a18ceb93f23a129a9547813a60e677b7a7d7531cbcbb954fbf86c07 +size 208732130 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..891fe48a4c3bd479c7681d8336db3d8ff119a77d --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7bbf1a9422517a6c26c0ec30780652f1844150f798d94f71690725fa30dc0356 +size 208731362 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..df736ff19e86b3a3ea71fd4310dc6d562e0fd905 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:52a527343a4e393f1b7b0704ba15a522e8548a84e13299b28ccda15afebe4301 +size 208731362 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_22_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_22_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c9b70217b836ba03304d554964be71ec27133c4e --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_22_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a86d933899482ddab00e8a3f80616652920c3c563166d5f95534f13f263d7c48 +size 208732130 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_22_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_22_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e672d827b8814e87f2dff8bbd67d23de9663f5f --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_22_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:098bbf6ce0d16ee518d3cb8bf3b12f77f661dc9e07e5b6290ae3a0f1ac8c4ab4 +size 208732130 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..24f257d3004b771e7567c442d17709dc9f2f39c2 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:01f7e8075d46fb3206b30b25f8ac6e6b9aa89076d412f98c426005934f91a6ab +size 208731490 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f7af2bcb173a6703d40235708c4525f80adb48c9 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:44918f32c0b95a1c0d075783ece3210a70d4dbb0f114228257c2cd40a7827fee +size 208731490 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_23_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_23_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bfad69f4f16d6911e200c8178f0e2ae0cc9308ed --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_23_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb1724feb93c721def40a558a9583c78067d06fb4bf8a8e5339cf9fb4e159a93 +size 208732258 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_23_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_23_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..234c47fea7bfa111e827873cb96a0e77af07c5ea --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_23_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8c8b054d32cdd9f1c426a5172a9e0c7c394b7ef22f23bc93075f191729c243e +size 208732258 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d5baaa0c5dcaca09b95c95e129d2e45e95c1129a --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:59c0763cc43c1c7063387e6968549d8c8138662beb7c260d0f3d7bec515584cd +size 208731426 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..702af5633ab2c9395319bbc3ab5aa4ffa97bb89b --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:050511a6aa93d412da28a0d716f0615fb9beeb3837abe1fdf27d6d82c2d12181 +size 208731426 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_24_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_24_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e5ae951bccfb95e0f35ae82299aa6bdf17a95f51 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_24_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:01678309212785514b68c91319f383d8ab2929c152fa86601fde4efd9fa3f060 +size 208732194 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_24_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_24_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ce2dd698c83e2e9df3d39481f105b392e1ee9659 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_24_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b248b57417716a13c0bd5eb76f481c8785998871c10c94764f821a08fd8db3b +size 208732194 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d7a48b038084791c71e504b7d9e30bcab0678b3d --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e31617aecedef74af02578b8596ba544f06da39e6ea87a3afb0b9a6887289828 +size 208731426 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..90b046acb6f4bee7f16942a52488c715b72c135b --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:85d0d33714dc8b44eb225ec05dd778e0b31ba3882e6aab5b5b5ce4c33380c78d +size 208731426 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_25_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_25_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9f5d209a5077e25b893864005b56b63b2a053770 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_25_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1c5e7fc6b86723e73b96160e9a6fb731d1b069fdb39b35d0ea7b0a16039729d +size 208732130 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_25_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_25_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0c20687e017503229ec1746283fee9b0d349b0eb --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_25_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ee8ef8495ef3e3fcd6e7412e7d136478366220bba6e7c5f50e2299cfdfa7951 +size 208732130 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8a5d33c25aa8df8e782b2959dd7a8eb00c8e40d7 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e464b5e22a9f93adf3b4166348c6c2a1c56692dcd35ac7dd833257c1e1f1dcf0 +size 208731426 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..83420a5563076a4ab29358d28ae008780130b738 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ca4ef37ed9538beae8686b622193d09998b8a320224de98db4e4a7fb4211619 +size 208731426 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_26_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_26_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e0c581975f6b7fefef5e79e3c63b4f6635c9e99b --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_26_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:98353d62f6570749f6f525db34f62330e321c2550ae09d629085612cac17c940 +size 208732258 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_26_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_26_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4581e2c305679000b51034f08b3b021334259de2 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_26_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e7b82f4f964d73dcb32f41c5eead6de2c1e22ce1216beea983a1b1bb5002df0 +size 208732258 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2c085108b85f840469f850d015fbc26fc86c4a05 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1bb296cc7102797cc264d4c945ffd6bc10380634f30647dbe86c142c471da1d1 +size 208731490 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e735ba96e07772abe204c4de24b5fd60868f0078 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b847b85d2a243fcc8a712b3c91f385a0d8a7673b271676944d6a30473cc97bbb +size 208731490 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_27_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_27_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3bc6d425365573bfa4345dad61d8feb857cc9dc3 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_27_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8245b72c0205c9a47ad6ce2d1652b33c7bea1332019ba5c9881ae0016cd7be8 +size 208732194 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_27_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_27_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b27090e619632dbdea276d246456ea57e85daa16 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_27_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ef3edb7d5ab4489aa2b78463113b077e7f9aaf4d73ed78d12e50bfc10efcdbd +size 208732194 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c62927fedf6589e68f56d4756c9da5cbf4dce736 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4cddc2981e8743e0b6d98e0330e1ad5829e396f129ee0c5069e62d60b0a0ea62 +size 208731362 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8f10426078991e6dd9fa22d5a5e5a1aa2a3fc14e --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b18edf029f465eb964ece17aabaa65c102bf0e178d6b8f58aec1c10026f6d12 +size 208731362 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_28_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_28_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2ddd7b8cdf5d32ec3ee927236199fb16138cbd9b --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_28_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:12f51e0d8c352a32eee9d7c21e41217430e8f982134509b338ac226460182b50 +size 208732194 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_28_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_28_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..600955c121f44dc52251badb94eb83d7544a5138 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_28_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9811c2d7655a610d9298a148d687e25bc75fc0815cb019b2056d2a8b14476fb +size 208732194 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0857cdcdcfa23b2f6b0e3a7085583f21371d5fb2 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4455f0cf4708d1e28997cbc5167a1aff2e288742f583c95a0a1d11d519f8e9f1 +size 208731298 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d39830aa9f3217edb6fa562c38d8ab14a99e36b9 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a3fc23b6c8940ed370046c4040f93555f0ff62a265f8608d1a0f76f0a319bb63 +size 208731298 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_29_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_29_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..979310e0d684eec621e5096f9ad5ba526b495b4f --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_29_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:190fccb150f06d794475c34bb3e86dc783560bbb3544ee9b5c488384019c9bf7 +size 208732066 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_29_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_29_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d8587da6a57f7e876dd741b2cf41755b8b8fdbcb --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_29_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:344e87a73049f155dba0cab81a7fa45fe556aee5e5bb59b0f039bffffeb9a7ff +size 208732066 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7ee3b2e87b32e93426bea45cc76d5ba66dac6d32 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4df3926e5839664bb0b9b645d717da88dd262da90b35e1d18fb064c398ac425c +size 208731415 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..11a2782d45fa2dbf1184e75016664c306beee526 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c88deb9946a62862e85bad120898953ceed1b89857f25610ad0055e52a45c9fb +size 208731415 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_2_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_2_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..22ca9f97cf3733d1348682bb063f3e6fe8d04970 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_2_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b4889dbe6d627e9f05d3f6ec653934d3a9a18cd93ca5c6599170ad49fef8b76 +size 208732183 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_2_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_2_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1079f89d49e970d1ca558f55504996566198a0af --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_2_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ced78b9d6f561148c90f700683ef9cc2208460c92a13aba41113f746c6255cc8 +size 208732183 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5ea0ac71dd0247f6f0e2c7463e46a9c6dc14bbd5 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e6b9f4dff645662b35c457124c7bc0d507cf61e987fdd9d906883a1a8091451 +size 208731298 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a31047efd03263d695cb0e65ec7d5d9218ebd9e0 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8796d7bb082451820671be6823036f33defbcb9cbf2673c00e07dbb1c2365f69 +size 208731298 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_30_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_30_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5ce665efb626a54230f22814c94b0b7780bf2618 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_30_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b26d5fe6b45afacc9f1d6102e350beabd70bd92ed4f3ab572b2fd51ed941920c +size 208732130 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_30_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_30_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..03b9233749d3507cad5830caabb41b4fc72f843b --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_30_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97176a23aae6bddd15aae87a48e93c61cbfc0224e53646716b150dd8cf8da535 +size 208732130 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9609a8e7d3edd25e8b86db6acbd49a45817a3e88 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cda57c4358796e0d8973d3ee5ee0b05fda583025384dc6e8fe8315a0773eeadc +size 208731426 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1071caa4192775fa04a88cf85ea92f65a1fadc33 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2cbf5dff51e9c233397832b04de1888ff32909bd0277e6f6e8c68812d7dede21 +size 208731426 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_31_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_31_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5bebaabdd30200f3bedc500f639bed5210d147b5 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_31_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f71c48d1eebd535d9ba980ee24474c1c7f4a461fcd41676d1017cd6d61a1bc97 +size 208732194 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_31_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_31_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..99c5b0c89f7d06fcd192c77f38e08e97854e40d1 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_31_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9d3b3586220038ac457f5141b36264f67b2b812000c9dd5d2f086e3c7bc3e36 +size 208732194 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..19d632a82f785871d819c89275b4d0c20ebbef76 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b74056aa6ab1e4f68e24e039e85dc2eefbeca4f5c945536be5d0df501fecfa3 +size 208731426 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0e6bf64bd4cf83d5abfed49096eb250c82b5dfcf --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de4421c36c03ee3198debb95d1f5252c18d08f82f3f35368b45f5fb64619a5f8 +size 208731426 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_32_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_32_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c2824f33209f802e306c956c03f64ab8e1c8efb4 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_32_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc219cc1cee6a678839be8b57fb74055b4b8bb8ae859b970cac36b890d12bf57 +size 208732194 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_32_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_32_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e48a817a14747ea2c55ca4eca5e3d82c6e5e2633 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_32_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58de6d52046bc9cd8c532918971c21ea45fcbe7e066b28c271ee283d40d737b1 +size 208732194 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b82984f224c05333c6313bd2e0eb06f5b4b92f97 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c66c193089cd35c4a445bd22d7e462d508193e193209608987dbe45c4f386066 +size 208731362 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0efad056fc11c5d43962aa20621a7ed556c1d1f5 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a9e94d58072d2b3c4b4e143d52920778e506435db787be876dacc125a8296df +size 208731362 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_33_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_33_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3b8fea560572bdc8968c51ebd56ab893f1175e2a --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_33_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:40568fdd5509429b34b32aba383c0cb9b9259828938c58f15e997ca9a78bfda5 +size 208732194 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_33_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_33_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..df1b4772bd607455ff0498cf29476c35012529b9 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_33_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d1069ca345ea467aad15311190ef31c3b9f8c90852619014bf7435b6012b9962 +size 208732194 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fc2e54230681eea8218b212ec838b6e88974d4d7 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:50423a050cac6a93ae04206885f992cc9061734662d83220298d55410d9f1636 +size 208731426 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e8895036df301a087517a0b01169e212813179a0 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a64d284f09661cbe441dc7b6e67643d466e99979bc05343aa38c49cd0e346d4 +size 208731426 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_34_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_34_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4d93bfaac4b87b1925e18f621d33ac5c3bdfe749 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_34_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cda5bbabc3c9111834c88135df7c18a7bbb6e044a21e22a1502f83092a61ec3b +size 208732130 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_34_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_34_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6e5380a437b3da85e5e1cef47c3b1095d4093b74 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_34_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c81a953dbeeb31edb34f6530bec75e516fd7ad61758298de637d6eeecaca0405 +size 208732130 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..57d16ec1a117de7714c953affe2d53b871955fa8 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e1f32c232e5a00075dbad1830d77ebb13635561d8d527fa071d2c6330214dd24 +size 208731490 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..532ba648b6e7be1a4b0b06c6c87779a06ca774a1 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:580a1c6eb146cfe3221fbde6d7afaf3b6fb8c1d0ff91053375e5888535d66423 +size 208731490 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_35_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_35_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6f4c79f94706aa87d83ec4d835bdb18c3f4a8d85 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_35_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1fb882574a925962f8bde594c8e95589b5ce766f9a4899367ee2f7b17fb81843 +size 208732258 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_35_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_35_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..02e56fb7f83f6c180db351becb807de1e26df080 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_35_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:643c7236a591a70086fdd7079dde293091ba25d97f22cb39a54bbdcb595716a5 +size 208732258 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c5454c79be0ba0f4b8314b81ec3e99e70ec12fbd --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f76af0819d154e4aa74884f1a991168f4c994871771b738ef7cf223fecea440 +size 208731426 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6c88bcb73491ab9c962d99d05b6d084414e3ebcb --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c08b678967c8b311782ab7a45fa0baa986c899d717b88d687feb8eb48c5b441b +size 208731426 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_36_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_36_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dc5df21a3a706377069f18a9ba195f8043a146c0 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_36_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a7e6b57a629d19c9efe39f1ee5ce4ecfe1f0f3dd06f6c2be73a985f25bbada8e +size 208732194 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_36_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_36_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7540ca16e0bf3da52c88f035e250ea43c2bd40c2 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_36_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a68f64616ff87a0a8f0f416660cff9a5c34ff7b27e29cf2b60c8fc29263e6c92 +size 208732194 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2c12bc929c6b1cf3a83ce4787c78dcc76bc561e5 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:928d55d0b647b7791e7dbfea50bf17a1329403e49dd25280381cca46c41f610b +size 208731490 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a078270de89589c03c728f712e8621da9ead642a --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e636503f47c6d9ecb717ce6405f5cb309ffea8e3dbc66c94743808f518182fb7 +size 208731490 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_37_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_37_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e84c6c63122982f1b689ca1f4ce767ab878efdf9 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_37_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46a0b58bd82239de8c90204869483e0173084ee69083275c6af17ac51c476ce9 +size 208732194 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_37_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_37_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..053440047ff92258229647de6e8d4c644eb7ba9f --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_37_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a2f26f781a2131ca8cf5c9b7c67e40fe3288ee8ed8738a70e144b5716314a18a +size 208732194 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e3e6c4ae33469b62fff5dccb8ca490e9e9abeeac --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bebc8ccbe522a761fb8c93b26fc4cf56cc0649d880004135ffe01bddc6ce52e1 +size 208731426 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..765c6360b38c76bd1a28bf001f0a18b7c39aac93 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a0819cef06037bef352f2c42e1ef5a50a1cc7ebb78e8664e8c12ac32c8b3fdc +size 208731426 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_38_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_38_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d217416e4e2ea1cce976c14b3493d18907e8ab07 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_38_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa8dca3772ebe58ce22ce6479cd40eecd1afb09ee587e2aee6417e70375a644d +size 208732194 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_38_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_38_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3606339c4c544fc457c242c4000b6085bf6da5f6 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_38_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b6d36555bfd72c9f45780049c2e9a30319d5b47c5511674009f02696bb75f2a2 +size 208732194 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ada641247a0b07b6368d1ad5e1668dd63f94b901 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0536f10c8d3d25177f74a56babafe0e673c41a2287d6b2fa7f368dd974f4b529 +size 208731362 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..444698b69a02cf68682dc9aea730c0088675d8d9 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4fdb800ede0e424f9da1fd0c6e37c57e3b409286da3e82c487b8aac4a25c158e +size 208731362 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_39_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_39_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..70616a26ccf4dfe4d867f3070debd9612d27272a --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_39_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:429a6f4dfdc24ad4cd7b371934d970004d89fdf122311ada6bb345a9d37ea79c +size 208732194 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_39_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_39_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ad20b5fb356572e800cbe06090f36ea0124336d3 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_39_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4c24490241616a7e4031cf226577c40d69bfc9dde17aa331a0c5f96c8913dcf +size 208732194 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..404e78c1bc5572cd36204f543e26dbd077646b42 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d0efce67e5bc3226cbc71f2ef6f2cf6fc129378205d05e17df13fff2b43ce2c7 +size 208731351 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5a8e592151715922034fe67b877076d8ec665741 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f38136b0ebddf7e08e57c23e17a8dbefa63e4662c530a46835345878d03343c +size 208731351 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_3_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_3_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c6dde7d0059904896fa05f6404523b208f6643ca --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_3_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e0fc6c1cfed41b3823ade4007511b6372d2c5f5cab61769e085cf87eb693700 +size 208732119 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_3_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_3_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7593c6eb387a892bdaa358fde8f17dc2970e5808 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_3_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aea720d3ef55530db79ed1a5ef53b93c39c913a310ca7d9b737c8d9b68c159ec +size 208732119 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b97750bde56fa17d8a4a7b3503e2a33e26e921c8 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a0dc7c47d486802b891689a71feccb797e7530cf7a58aa92bc308a408abed746 +size 208731426 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a3e85c0f490e6317c8c1bb77c40d7e227002a920 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3dc1e640ec58c34a5fd86acc8bf763b9d1333ab7f012a0fa36b8d3c5b37843cd +size 208731426 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_40_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_40_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..05acb03c48652c8b10da3f45c07cc89c6d9a1dfe --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_40_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4898ce9394e3ac3ff80e69c23b83bdba2165c0b7a14859cb983e4068aef69c0c +size 208732194 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_40_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_40_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7c65400c787af53ac0258545304f96d31dac9e5c --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_40_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7507062bbc5745f4e49a3be790be1c922c7dfa942160690fd5ca7da710f70a0 +size 208732194 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e443700eb035d9889eb855e907cc543c5c2376ce --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ba1286b51397a5fd637b6eace9a07906c295404da5fd4c468fc13d547a8dc6f +size 208731298 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f0ae50190197ad797a2d01f1504660265852335e --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:feb23681b53706b0b34f299848ef83f310bcf6dffa8b8fb2e424c832b00c9ea8 +size 208731298 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_41_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_41_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0a417377036c2a6185a43e5e2a4fcd3dd08c382f --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_41_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3cfd9bbf9181cddfd278f0595bb247e891159df6cc33e2cb7e404a2962f47a8a +size 208732066 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_41_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_41_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5e25eb24eee885d3a274207fe515ea4ed0d396ad --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_41_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e419d6f7a5f6098b2a40e1f86a487698aba6439d632434e53fa334796faabcd7 +size 208732066 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9c8277b45a54c5fc130858e5ec9d55f10fa7c7c8 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92681d09beb4c87fd60dc48df4221de3330d53618eb0e07e8c99c58bab0a8577 +size 208731426 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2ab406186349f739224374bcb2edd68706eaa6f4 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f890cd65dac4291096aa00c358facfbe7f1037facfb8334f2b36aa6027bb0476 +size 208731426 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_42_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_42_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fe3b817558cb61d1c2ca12a1fde2475e9c25c514 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_42_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f5a15eb47d0eef93608a0b3d5790d90afcb2d9d469498aac6d2b5ce886126f7 +size 208732194 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_42_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_42_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f09340ef32f68ac11fb9d49329fa200ba1f28180 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_42_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ea6c2eda906648add1465acbe5e1158bb18984f4b02afdeedec579359641d28 +size 208732194 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c746a239a26b642df2b8169b372cf6c2bbc2e187 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6923f4d9ff47edeaa15cb5e121f7c4a513a1d9d709ec43fc087fa5653dcf37a8 +size 208731362 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..35739056813a980471157748124a529470bc7c13 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8619e4139f78fc630d3c8d5ba149ab98de0cfa3490f4def4cda06fea73edba31 +size 208731362 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_43_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_43_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..61b2ef69088fffb4f3ba2a8ec341ece9a3a69ce1 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_43_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:53bc2db2d4fd8b02769bcf44db82f643ccfe7e2906e532c821878433ce1250bc +size 208732130 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_43_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_43_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8d074a57b4301491e471cbe461eced95c73908d1 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_43_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:55d53489ef6bcad6975bd3d7216c3650ca8a8d03565a599f1a71a43c7d3a7ca2 +size 208732130 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bd240230ccb9ddd1bccb13ae4edb0b08c1c02002 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e1e5060552c2877dd14885074f61caf110b7e758c0d0d765ed038366ed2d6d0 +size 208731426 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..64bedeff4d59248fcf1f138a8c8fcad667dfd6b8 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8109900bf4b5f44ca43784d2f852240e2ccec2c5d683e940bf94291f8e171780 +size 208731426 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_44_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_44_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..126c90de5e425cca878a633cd96281aa9e60775b --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_44_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b1efeca554c5761f8677b5f3ae2bbc4d0304f85dccba417d18871ef399e0417 +size 208732194 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_44_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_44_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7002bc27b378167fe028bc59cc86da9506826e28 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_44_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ceab62a5b8c312aae900408e15d1a36977e68fc81299be3f8e06c37efcd29ab +size 208732194 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f8965f9b773f10c9ae90e771df9b549ad0696999 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9459b450e9f58437b40165490ab69799500cc96134e06982f8ee78e0d40cd8e7 +size 208731362 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..86c25cc04d2fc2750d3b05933fe45f435697e098 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f509704b08f3a86ab0ee3f8bed4d493b2161eba180b766098f021b88aeff6d3d +size 208731362 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_45_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_45_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3728e22107786cfb73cad797248c742a8f16fafc --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_45_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:24ce2dbb97d2e73dcd65c39415e61433f418207eb60a6315a6e9b85e0913794f +size 208732194 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_45_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_45_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..14588bb62db49c12484b4fee8f645e53b0bf1357 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_45_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2665dbd0c0609d4ac8992d1ca49eca03b9037bda050586aae854bb1b8bd7b0e3 +size 208732194 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bb88895588939b5178cf4a17709d229488611af0 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd8eddf8f637cfa224176d399c8e98d74d867a3518eadf3e4c3a6b1ce46c9050 +size 208731490 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8c5b8a21298c1b85ab49ec99098af05218c54123 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:45b21277d366cfc0956256cf61c4027213fd271f397a0398d5ac8f322ac12a0f +size 208731490 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_46_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_46_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ce1a448de1778caccc14258d8479a01a08896dc1 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_46_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6101fef9837e7b2fe58899fc8c5e2b2dd3b288e5655ec29205137b4353200333 +size 208732194 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_46_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_46_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..63b63726de2a8104a0100de0a5e98e61f9c6ea82 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_46_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10d0704e0ef9e9d19478b832ef8bdd592538deec72eed3f1580e47a2d73aa05c +size 208732194 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cd89be138361bd7d3a49674b33c1f6e348155b4c --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f1e5cafa893e3e047cfb3cda2b6921db53a89255f7b21824dfa9e7348926bf2 +size 208731362 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c27fcb08e2200520fc89d8621a3ebc3bfac2de30 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08bf12e824fd2bf51deaaa942c2c23b5868fff2039194aec945a149b0c4313b5 +size 208731362 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_47_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_47_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a735fe73a5778c2612d96db07957a479caa480ea --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_47_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:28dedb8f7f01597260bf53f63436c7b5f8e8ca1cb52a6b2a3ef9dd99db3b9f61 +size 208732194 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_47_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_47_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a472253214a0b3d76618e9a55d063ab26a0634c9 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_47_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c946a12fdd13c30d19b6a061d3867487898abc9fd0568b3c8beb1ccc9da9301 +size 208732194 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4aa5268dc116449831a57cc844f67390b0e1ec3b --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ef31073faeb07eb4bbf60b910d31371d3843f1512ba7bafcef43c428f3f6f72 +size 208731426 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..211b08f3bca5171bb096c2f499a15afc9d0d5da0 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f4e7ff2383c183057ddc679747970e22ddbfe5cffd5f3443c77c71186482f645 +size 208731426 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_48_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_48_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b0ed0bcc5fdd55557cddc0e0a0652e858510973f --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_48_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4834144ccb665586ff41f4010102fac766cb6050b94ff7cbf60005f5cbdd0640 +size 208732194 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_48_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_48_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..09df12f9d93f4df701826b0a3e0794ae2803e993 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_48_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8914410491c21ebfd81127325f57be8788771be9c74996efac55bcd5b189d0f +size 208732194 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d2f53e1770a352045772f1dd34208face699a23c --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4aab7f798531f2ed804f10a9c0cd9e71aea272139fe37f79e6fd234adbabd4fc +size 208731426 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..eb5ecb8fe4379ab960b13f48bbb7bade285c8ae4 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:12b860b2d3cdb8475c69c491b75b7638d56f43a57bc0130e532612ed2c23a120 +size 208731426 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_49_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_49_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f7864451bf20f5e8def223eca8a656b61b617962 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_49_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:83669e1791191f74cececdff4bb9ebf08aa84d6c7e57e77dd8fd386316adc6e0 +size 208732194 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_49_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_49_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..adc24ea8dd936df556d1963ad22bdbf30f9ceb04 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_49_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d5bb83adbc1ad8547089b301e871a9153ecc10f6387fea8c68314ed33a6be727 +size 208732194 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a2da931ad9a25e020c1c4863740fde6fab6ca2a1 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:13e9078a897ef523891496fea277d17e4c42eaa15a5da6b392bae0d40d0c2e5d +size 208731415 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b6c9b3253c42ee5ad1a07f73ff06de37fa3c9b43 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b3a1409137caf174b304e206852e519c6d3dcd80a7d6e232b63c0079b3324a36 +size 208731415 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_4_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_4_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8233ba9769f4e9816ee4b4855d17883a89682ba5 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_4_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58dd32b69c786509addfd00c04f66aff2266a7cf2f4a3a5bb62ac31e9eff2002 +size 208732183 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_4_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_4_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..67cc00a7ede079bacf868209f61a706d1a2c33ab --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_4_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f18042e2c15c6f708a7049db0120dc0b6883eef4907c12e4ad6a9e7682ab6e6b +size 208732183 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b5328a1adf057fd1b5b0c3fced9f30d12c4c44c5 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:368393138277be5a94d4648dc9e6f0f4b47d00100996d013f6f7252dabee15b5 +size 208731426 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c9c3f9d8be9555233fa0b06abf8a8b49c73090eb --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df03e28f8d1a113dc1adfccf3ea06355eb3dc4496c459c6cb66e11e393b140a3 +size 208731426 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_50_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_50_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..45f9e5e124a96d28a73c90e894507784eee2324e --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_50_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fed7796742a4a0b88227490242c46cbef9f6805048e17fc9cf66cd68a93ce420 +size 208732194 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_50_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_50_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..07c298c058ad1d51a1d74e3c28943cfbf89a6efe --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_50_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7593306f73f7a106a765b920475206ccd0497cf49fd3f74d0fe2e38f4cbf416 +size 208732194 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..64271af4347a418b6768a5a5b5b8e98e485389c0 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b58b1123638029822840d5acae3fd92d3d8704877191fdb92a03d3d017fde48 +size 208731426 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..784214988b7bf6ece9c89086663b0180a30786a4 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:180525f3be517d46657af3c22574079384ab4fd36abd1bca968c1af875a84ee1 +size 208731426 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_51_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_51_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cf73d719ba3c33acbc8d9aa87eb2d3912f63c9d4 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_51_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ea231f6ec0ad8fb25e43427c6669ecafbed6d8bbf3e10430c0dc0ead144f001 +size 208732194 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_51_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_51_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0abb16bc285b2a40ab00aa43b23d90ec96eb7011 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_51_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:26e06326a1a3d5338cc0fca043db6dc6a822e685a5f14a1acbfa1ece96e50a74 +size 208732194 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ff92ed561d695ce7afa2a6aa6009638a444baf87 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:783fa9eff565fa7dbeea72e7c79975a58ccc56279b54aa3db05380bc5137b223 +size 208731426 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..602efdf5dd0ce31c34acc0dea9519fc2cabd54ab --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:66864e089047d7d94b76401b3fe8659e2e1b1587526840f8d6e3e34d3e604434 +size 208731426 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_52_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_52_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5e07c4aa5c29bb19e4b5ae9c7dcd3737621ad8b4 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_52_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb3f315fad824a34e7282916a4d4dde39b6693246e212f01b40de2e3ae356aca +size 208732194 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_52_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_52_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7eb56aa49af3bee8e8b903743eeaba51251518f7 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_52_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c84d86a463b18d057bb1f426a47eefaa231d2803cf912fbe2dbc6d922bedba22 +size 208732194 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..68ec025e9a8e8a5f8210962a2e3452548b479d61 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:68b7b948e13527925880c382950b65a0338942e7fcb02baf2471c8da8acadf81 +size 208731362 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..166363845cfa6f7b19e7622a3b723ce52b8dea6d --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c76f7dbde96cb6498fd48de8776664d1d7335b08f2603a1f9c67be8270d7865 +size 208731362 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_53_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_53_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..05c2d412d9a5399acb53f71a383fd32dca537579 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_53_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ad8d47f01881116de1be62817aa8c96f394fd8f148427650bcb9056717c73ef +size 208732130 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_53_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_53_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a06a10e4383dc16a105873ceb3c79e82ad31fc5c --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_53_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ba23140c0ac4c50537f994d7549541a1307e00724e38abdc09b6f8eabc15de1 +size 208732130 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bc21dfb0b9fe0df0f2b7d0137f9ef91e4c7f9cd1 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d0381b9045ca98a1964edeb7c5ec62a77794d7df0ec510692c432bf7751639bf +size 208731362 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..eaf015d62acde7a118220815e470df3ff3c64a84 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b4115c656901bc38e29346698ded00eab356edc611ad34b178857ea1a1253dd +size 208731362 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_54_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_54_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a8d703c1bf120cb057f81bf3ac7fd5e959dc4bc0 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_54_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b1708f1b57162327e3fdbea2a53942b5dafd5d631ccdb6f95a157fbec2b21bd +size 208732130 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_54_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_54_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..71625279ccab8e3699141bf0676cdbcce7b6a665 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_54_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:545b440fcd8622d115632a5479c9d38047e3724247ea5f75f251d7042ebd4171 +size 208732130 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3983734b13dc51d6779f820e46ec2bb07364112d --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b1e7377d46e7462d68b41fc35bd9fce4ce661ae4f7906028a5a1862ca601e7b +size 208731298 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..35ef15b67852dfd5242458bbf91ad7720e6e4c71 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce162d818352ad40828d4cbb3b4a6748fa01b3636c1d60fcb2a5c895cda7981c +size 208731298 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_55_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_55_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c9be3a20269ada23990bc98c8e90269bf4eeb0a8 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_55_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73c4580b8abfb209c18725e38d5dedf4d9add422267378f4b9a3240ee50c8732 +size 208732130 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_55_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_55_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6af86f2ebbf63afa6068fc36859d605e7b12e961 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_55_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9700405c7d5a94677daca377bcd50298aaeb4205adeed2d7cf911bc2f0e1e248 +size 208732130 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7a628c5a90b03f4b81bc153b4998e2a2622e9ff8 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b47ecf07e0ab3daa03e52120c44695351cc2f4375a616b5556282b470e1828a +size 208731426 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..42191cee02fe34ff0fedd8fc7a33131d38080ce0 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:689f0406e673a59ccac1c5ae26755acf17509a7dc44c7ce728860779573e741f +size 208731426 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_56_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_56_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7f25a6e26ae4eed6634404f429026099f07dc970 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_56_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b849fc90d7c6eab3d18ed962d1f1ec75230a65934667b722c6f8a7d6386e0c87 +size 208732194 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_56_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_56_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..19c8a232c71db00f5db194d4fd92366ae413fdda --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_56_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:98d71746f70d8db5a7a2ac053fc56293ca7ebe0582ddd8fec3700e345b2944c7 +size 208732194 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e8d97c34bd33e2c6db4ff97d1513627b3c027c86 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be703b0b274599dda856f49f940843a785582a6ce31abb47feb2528781af044c +size 208731490 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dfd77239a909f1385df682ff34f786269a098f43 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:42b0674b97244cd30dad8a737c64a6bdd1ae80f20c6a07bed3bd507c763d943a +size 208731490 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_57_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_57_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..886f8583680b2709e892608b32dcdd25df9261af --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_57_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f0371dc75b9ce23068f807b4d9637396fcde6a5a401a1386428477198e733663 +size 208732258 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_57_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_57_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d9a379da1be669404b074a659decf4e6341b5686 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_57_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:44296c85df2ac15caea30520a20f63e7f76c11c40443e119396ba6ebf6a2e536 +size 208732258 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2debb1faff55ca49565532dcde92aa5c19bef992 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ab9e1ba497e303d018ee2eaeae8f31637639fa8ea00ec3c012be796a389cde0 +size 208731362 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..96dce9117d5ba3cb081084ecde6416b165dcfee5 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f8e35e41c7c21f6b4d11d016f1b59440a95a6f18e13649a21a31013b78ec200b +size 208731362 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_58_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_58_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f55b47247403dc654a438dc29e056f22d1287bd9 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_58_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6240e162bfd3d851419011fa266df9c98c9ad9abdaed1d6ace9e75f4ac076589 +size 208732130 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_58_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_58_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d9c3f7ccd9b4bce1fc92d2ef4e4a21d4fc53635e --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_58_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f558166dcb3d5f320a4a1217c34dfe1393bd5477490437a69d721f4215e0e95 +size 208732130 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..da5457e38ca96d36c0ca4c525d74da760fd849d9 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e5c9c7fbdb49914ef38d8691539d61eaf4906879d6e21a8e272924775f4e696b +size 208731426 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a28486f12ca012fc5fdfa7637bc7ad4e42f21265 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d7de88d03462c60ea4c8946c2e73f6547fe947d6220442f17e4762d655229f14 +size 208731426 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_59_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_59_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e5bf6877bf9332d24079d3a75c74c9c8169528f8 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_59_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c5be8adb9d0da08318f090accc1d3cadf014bfe5fe39e63a5a1e714c6134637 +size 208732194 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_59_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_59_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6c86fd8a31dd9633b354080bba535a5c2f4049e5 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_59_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bdb195754db7e56ec604ed06e5ecbe4a98e90d09470a911445165c7209ba0924 +size 208732194 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f50a4e61c1c97031b11fed460cb37d4f80bb16eb --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc80f1da9127c8df20f734aabe7a92f6f38498c9046517e0ea0124883ef6dc28 +size 208731351 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..32d990f54f77fec5a2185fb53a2eede6435c463f --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a61d80f9c8069e162432733f849da1a16c802fae98de8a2a571c223edc29f4d +size 208731351 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_5_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_5_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8c06879dd08da38dfd31d7d08fe4d7cd025c429a --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_5_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:54af829ea9e09b194a895309fce548d7ed5b3b17afd89d4e7957d0b55940ea90 +size 208732119 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_5_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_5_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2a2c3f515cec17a955f5efa9834b8ef0355e9bd0 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_5_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8446aecb8ef5a20f05c2fab0155a4f7a770cddccdf0251a21c90d7f6b96fe88 +size 208732119 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2ef05038735434a49e8c5e53eb2ab7707582376b --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e561c983725a7ecaf865847fbbc9c8e47c6121c6c0f220fff44930593a36f74 +size 208731490 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f1fd129aae8a69741398a2b82b5231cf3fcefea7 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b95b91894dc01ac2a72c7b1503195fdaccca26376b85c3906fff0c5a47e4c9eb +size 208731490 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_60_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_60_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1683b30d3304a93e95cab0c6d35232e3bc93267c --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_60_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6100c224b624587436969d9e4c6f63baad0f0482a4afffecb6c2486ecbdc7eaf +size 208732258 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_60_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_60_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..daf2ab846c27bfb7eb9372880b9129c8a46482ee --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_60_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c210514a47f0ea87efa6163b123850297cf2c4ef7c1ed64a590ccc72651a81c1 +size 208732258 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d40d258727d34cc1b26af2819584435500258b58 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2690ca630636dce528e12fdd77b1516fab4809bc43de41b8ac3a57b86ee5dbdf +size 208731362 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9725378be37c9c6aa421850c22cb3f48cd530bff --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c8f34880298d9a9bca3e269e1e51c021a7bd8d67c551ef26126e4cb69cc7a6a +size 208731362 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_61_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_61_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c87d8584da546971ef1e852b28a87039463158e8 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_61_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b0d278621bac9da4721420d50213145f0b3887994610310bbeb06d376a6fe7d +size 208732194 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_61_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_61_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5a72116659cc3cf323b2e11940b0291b66e6a012 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_61_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da6d9d950a174f4bd3ac375c9b33faece6257fd66f126185b4a2b9cbb834c5f6 +size 208732194 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..811a85c88e57c8f213dc81ae3bd18ade5193fc7a --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d965cbeb708676bfb102f101b56648f6fc7482a32782339beece0de4433ecbdb +size 208731362 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4b49daa320466bbe8c8292c54a353c6f18e3b77e --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9870595909d64916157d15b2d7e3072750af756e85e9dbc674a5fa97c5b5b0ee +size 208731362 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_62_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_62_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7c14ad5121422de0e78fc6acbf28a0162ef728c3 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_62_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d33edfbf692962287ee73f06bdc3272eb019ddc3f922f7e244672cb252285591 +size 208732130 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_62_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_62_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..138a766a10e982bb5b5bae32220c8e9f31cc8ff8 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_62_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4db8b3d6409b373239c56512ccf38ece5879b2dbd5900b33046ccef8e299ed2a +size 208732130 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..eea2a7940d728ec4cfb7f3dc4552118c32b8aeb5 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0929ffc6a8aae071c5b01c3fe1d730bb194e88831bc2523b3b98f801993409b4 +size 208731426 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a7fefc3c99fb28d9f4367e73e77bda5459a21a9e --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f83a6f2efb9e3dd71151c9c56318aed881ed158bea85da49b542a78b56ce3203 +size 208731426 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_63_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_63_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..424f8d3868f0df305d7eead83315693a1de109be --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_63_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a464d49a16d87c7f2ab352feed9f112b6bfe6a76655dad3f05a4ad86e72fd27 +size 208732194 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_63_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_63_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..41c7207c591745d5ccf6f0e06e06e69408b68e50 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_63_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f72c2df3963e0f78a421d9b5eae99df7483822cc54d8c28422cc535bf3d5428 +size 208732194 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fce44f573c585c983e8ad0bb8d0e6460beb6aec9 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aeabb822e035ef30d1135ba14fb5c96c190bfbff72e82ca560e8b2e5df19f5e6 +size 208731426 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..30600fe2f7641694a227b1854d7eb8ae5fb9ef59 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97677f3174fb3542b900fe86276066a1982bdba03b2995276c71f9af023e4cba +size 208731426 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_64_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_64_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..eb16f920375c7ce7f6619005cf11694ba1ccc0f3 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_64_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:16ce671384a4a88051e2876cc2168c14d09cc722a79122c320dc371e5d276a50 +size 208732194 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_64_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_64_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4816527f28cc1aa180a14e0856093c4e888b21ca --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_64_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ae63dad966cc32deb552474b23e4c8d343c2d403308f311d81eef811838547a +size 208732194 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a769a758808b362afc8e4f6a58f2fa092ec09f5e --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2180ffa95f0466135200f352107af71002ea66e6674a33fe4c2bbc425248aa24 +size 208731362 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..41b6fdd9ca5bccf8f3886b0aade700f589178a85 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aaa2dba0bd730171a059b8f3eb537c8d6547d83d1b33d4f29aa3450c0d8b2e9b +size 208731362 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_65_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_65_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8f8a391424bcf50ae1ff3a929a678e35f51f3b2d --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_65_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f36c0aa98e67a775bef8d08ec3329491df5d550e136fd24a09f03a6483ea180e +size 208732130 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_65_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_65_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..122cd53571e72aae0c66735efc74baa7a7d6caed --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_65_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ac8928fec5f494eb48fedcee575a2fca5b7c1b31ef5e9114afba0f0d8b57494 +size 208732130 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..90504e09af6d8b83d2988f553b2e467be3b8d1b8 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b53f23eb96619d9bc44ac1f703dd336b7b1f56e63f99a02e4e4f6e64a592036e +size 208731298 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ee34eb336efe6187e328119a329e2535105fc633 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08dbae6c601d631fbf10834ddbbbe72a9b172934479720edd6e2b37dbd6dd272 +size 208731298 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_66_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_66_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..76f7d861f9bb7d095fbf79ca7fd34ca345943f55 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_66_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1bed3fbca5c8e99a601171d990a3373c7b02664eb5807ac8fc69d80d8591156a +size 208732066 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_66_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_66_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cab66e864ef25b01f9c506e41e3f470937eaef23 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_66_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:81865a454546cd8bde24537fb8e30695c2ca0f9095613f574c98eacec9a253d3 +size 208732066 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..708d4c93650166705846997c4aa4aee3957523b6 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd17b8ab0b7569a8a437bbde63eb013296074d753fb4f5674b172292c6f9a799 +size 208731362 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3cdb2a3778a412dbf01d60964511599334c26744 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f0505e05dd428a05d5945a862a9be7b7309b4ce89b91ae8645e90dcf8640514b +size 208731362 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_67_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_67_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..776a9bdb1922bca2a3ab445aba093da6200e1c29 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_67_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e85e4c747a58d29a6b918862908ad14b95bdeb9d9d52403333129021c0f3eb7 +size 208732130 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_67_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_67_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..565de230f9e6b380e03fd0339ff0e9cacf570ae5 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_67_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe1f6366605491779f2589dc4b8bed865498229bc495273948b7586e6b0d78dc +size 208732130 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a08009f2ab79157e32a28abdf1dae4a1a9f2389b --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0127e6d12c7289a5de3ed3101a42ef692b7516a0f2c3f4fd7888249ba04c9e0d +size 208731490 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8a37a7af5050aedfe70bef6f380f11f810b406cd --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b374577e7ac4e01948bf5cf9e75530f191c88c65fa4968b206641b95ae17aaa0 +size 208731490 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_68_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_68_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fe0db51023376282b08f30b3f7ec596d45b62709 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_68_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:82d54c4b7b72307cb32ae22fd2c7fbfc084d90acd512d55f3d6cf089a3723e41 +size 208732258 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_68_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_68_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7713f4788fe82ae9cd860dff3474fa875668b39b --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_68_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c748475a7aeef9993ce12e2fc6692d714eeaaa2c95a04e2041f2557ae508ff7 +size 208732258 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..070fca08b523bd6a6b1788cb51ecc6d69fad31a1 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:45f7a5633d79e149070e2d81989307e1b7bd3aa1db17a23421fbc64d3afc0a7e +size 208731426 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7e63a82769b0d6d6734391b48d2e50082560b6bc --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff901f5949b6988388dbedc2f885553e02851848b24747a04540bd52cdaa7531 +size 208731426 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_69_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_69_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..24dd6d04c00f35c63b7ef24e4ec1adfedd2e281c --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_69_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:87a09299c2de7e63f9e355f7ba7c495d6d09e649e2331014803e2cdd5e95b9be +size 208732194 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_69_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_69_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0bd2f3b08489c18a45c7c3d7835f713682088e5f --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_69_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f661bb0087dee05b98c1c55b11df40d6b6b0503e7cd20a49f8fad651bafaf3b5 +size 208732194 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9c4ea72b5cd723b44ffec5c8d98eac579ab8f674 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab6893eb834da2c649d3990f648a9e3d2625cc4f12adb55aff25865cd86c1e25 +size 208731351 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f0c06e633c7b41c1258365d20a4012486f79dffb --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0109b864a9440d9a7ad651cac5dbde4c72b0fe115cb875540f3dd3624f75ecb6 +size 208731351 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_6_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_6_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e453a648c5af5a690025c3b724dcd89cd443749e --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_6_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:896247e130609220e6f731ca63e32eb62a403b5cd6767b2b00753ffedb2de7eb +size 208732119 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_6_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_6_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bad80901eb546d6b85d54cb805bf87a341aca536 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_6_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51ea4297490829c4e29902ee1d65d5f05271470baba8e886e37243ab9d0a0ccc +size 208732119 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7d10e5a8966819d998b7d70f75b1fe696be9ca5b --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c71ff2c0193be5d7b5ecaf8aec0f66e23e3f5ad861a921fc20e639afc196b9f8 +size 208731362 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6ce45008ae37ea68393b505854ef4241caf51368 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90a61a5125f220bb78fad5615b19d63f156f0f89f947f7dc5f3a8dd45d4d96e7 +size 208731362 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_70_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_70_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..12e401d60dd41d6bf19b866bb69736913db8891d --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_70_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8e1eb713b44106bf3d43aa5c4f149f223ceff24b02fd319ea243c6d0eb84aaa +size 208732130 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_70_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_70_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..da836db754dbda0c82689e7f02cf5808b619c69c --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_70_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:41556f9bd93fbac8e1650a719766159b43cdd6042a19875045c9af45e29b9d02 +size 208732130 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bec5539586e459754d5d3b0eeaf97b12f9444acf --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b470205fc455e074b23363aa40a63d0a1948eb5b31adfddd12972680b083f4b +size 208731490 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f4b68ed5679730170968680caf2a0a0ae490ae40 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d9fc9310bb9abf08bdb40d444a58a4c7647a266f9174ef9b3ec76cbddbf17d8 +size 208731490 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_71_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_71_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..540b77e632749cefc39eadb303b7b67c02bb16b7 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_71_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3026035b0d7db0f39ddd0be8791e6b4199eb1c269a599c274da086221fc7230 +size 208732258 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_71_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_71_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..15b79ed5dc4a958d08df97fe9ff1cdb8adffec86 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_71_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:80061d99e567c9b82963a6144a2347077e9fc791c74333784d58ec6fab04b178 +size 208732258 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..11ae7c901240ab95003bd77c640d3de2e553749b --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:86245f5da8447b18c49898b36bb1230ac5dccaec7abf774623cfb061cc99d52e +size 208731426 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..429d2a630199f77d0b3ebe5d1b3c03a58dded0cc --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5901b42c85056a6ddd08b03ed8c4be882276ac568853441b1ff4da56cbdcefb7 +size 208731426 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_72_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_72_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bd9fa65c30f88095452e73b4470c56e5a7806b1e --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_72_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ddd674f55f93b6fc2ee560384e68676f10459c66e6ace491a39a0e54f880d73 +size 208732194 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_72_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_72_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..518db85419f8e90f5f723ec0b1bbd8e2910cbaa3 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_72_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae3d6d917c02bc5341d677a2c2aac4a4a5a8ec25a682264da5e03731a41ff4b5 +size 208732194 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..849ed20887e8033ccc0eaf9b3b1d79ce58bc34ff --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b8d05b9511008230ed2613a18bf8b05f2607e6d7bd03d5b1b84d81973ed96d4 +size 208731362 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6afbec9db2af9e4f692522e82a92544a6831a288 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:071d77660265bd7855573345200d333bd4be5eb6c5d29e0ab596ba01d4f14bec +size 208731362 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_73_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_73_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ff093a3f31554851da21f5a6aa6013b2e043a76a --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_73_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3cc4e412c8db600b66e4423b8dfc8b63ebaba4ec8831a5d24f236276c0ec25f6 +size 208732130 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_73_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_73_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c51f0b8f84e9d1d547d1be89508c971aa401d288 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_73_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b09be2721b1cab5a63431d51c6a18fbf438aa1c283ea07453d7c77d942a730e +size 208732130 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..92d1f094efc6a2bb8361b5d169cc46813d2823f0 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e975dd7ea56e6a7a3ead2207d87ba5311ff2e13a0205034678b3c43b438ebe72 +size 208731362 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d8942788c87510a81725cfdcb047fa9088dbfe70 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ad9e64851320688d86600fb0d5485e67e5fb5310f7fcbde60347fdf5ce07283 +size 208731362 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_74_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_74_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..823158df517c5104527642941ff5b939b3dee4f1 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_74_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:85f050f67175cbf06e099f7608666574a1fe236e71c820e894ee0f9873f9b071 +size 208732130 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_74_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_74_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..64685d32e6d21a51fa06236fc0c3d3c6f40aac88 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_74_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9bd2275f5edb026ee0b49329cef8447ad4338c1c70a56081e8392230da6a8ebd +size 208732130 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..20538697343cb4624e0beea559c2c901e2410bec --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4079a456b9251f1741adb6e8e81d489f1f8801f791070281f0ad182954426e64 +size 208731362 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c772dcd948d74f32479d377d375a89b65d7aeb87 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:88f3535a42c5b472a1949f376ee34593b29718f285b1ab2faef708a8a855fbdf +size 208731362 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_75_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_75_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..76ce69fec91558f7ec0bf789317a62b7630e36c6 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_75_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2764e7c16949259f7c5b61823c499ed1a2c09de2bc2e3f6611d8148f94031c5b +size 208732194 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_75_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_75_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2e5ab182a1e85b5ef2c9d12116b6f311b733c7b9 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_75_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dbb2a03352fd421d1a79dcf7ad15322f9734d795e8cf11447c36baaafcb27ee6 +size 208732194 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1074ec8512a01717644ba022c86fda9199e0e3e6 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee5aadc6730456a02589010edfa33e3db1a7d8ee047787b16b93b92f24068dbf +size 208731490 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b126b67aa7e6048d7bf280107ea72a64a5c7574d --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c584fe7cd891f4ed441a010d51f1f94d925a3e2ea1b4a255a6e2374620883784 +size 208731490 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_76_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_76_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4109c74ba041e2513e7ac72dbecf156bdaa45a6e --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_76_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a0cf245f925328679d29d93d01e407c7a317a1fba77d59b19620aaca09f29bb3 +size 208732194 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_76_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_76_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..56bf98fba4c1882800545e151313df7f0d9394e0 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_76_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:68283a91c4659f0fec2584ebfd6412e40f6dde17511185cd3a98fbee35929ddd +size 208732194 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..406a334c2f5283953eeda15274c112c015f9f075 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ff28ed64679a43c910d3c4f2d1cd7a1b1eb30ddd6eb46ae06e736006d6c1d52 +size 208731362 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..74c8329a1151c8ea0ebd9b4454c279f5607f6778 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:18f2c46c470189c68255bcdf44064e7d5e43d37883e38ac61ddaaf7a659844d2 +size 208731362 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_77_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_77_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2d78e612e18fef8e33494d1300b3e33806320859 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_77_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:05202e9cbf049273dafc75d74d650a43f841b2b01d0f9881abf0d63d2b4ee8d2 +size 208732066 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_77_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_77_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1a0b7d78d9914ea85e2b4d9cf4585bf512fbb566 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_77_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c35a84073a3d47e5369d5243c33a70c99ad1fd6a05f9cda8398a2c6721cd968 +size 208732066 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fd8eba9d34d64e4fe3bc30013dd36a686a039089 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a1f445c4a4bb246e4eb626723f048b6b19eb4c519a7c07f3e22a1794a260da82 +size 208731298 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..784c07f0b4b762fbc8ee43690a1631efe495398f --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:199c8071f862df62bbac9fecb3071a3f3b1e0a50279432a20d3afa9cf4520c52 +size 208731298 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_78_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_78_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..24b43ec8c45b02e0e698d16a2c75dcfdb639d45f --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_78_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b827f7fe057a2df2b8960ecbafeb7d4af9765b3378b1cb81cdc19ff6f4f84656 +size 208732066 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_78_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_78_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f0bb4975eada8d521bce61e61d5392230b0e2da0 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_78_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f19b11a64cff21b8597a586e93bd189e91a97ff44d2ad5e465b9850ddea4f1 +size 208732066 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..816c11e16a7518d30014859efa5afaaedec93bf3 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:88218fb95ac17e1df3200f9673d7e53a05986c94cbdc3cad65d5c55039e1d41d +size 208731362 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0fc85ca1864c333f551e6763a2171ffa468a1128 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73ddfef29f0f72727eb3d16172d3c704ce5a3d715e55e385496d348bda8fbc27 +size 208731362 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_79_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_79_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1f39eeeab3e28fafbbed9ecc35ec764149a1ee93 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_79_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:353fae816263f2d2c4b512dc5a0a121f76b8d086d0566db4c02cbde4f6eebd80 +size 208732130 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_79_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_79_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f7a5aa83a9baa18bc605b9c7c86fbe05dbfbf2b6 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_79_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:177e4e2b7b66c2075fd95fa4f3cd5c3909bb027e1bfbbe1e3353fe38e80b93cd +size 208732130 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..704972c4375a38b8c118a78093e1243d9ee70895 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca54c3e007f560bea2b0a70a85b099ce8afc0e40bf6a12e0b5c8e183638423c3 +size 208731351 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e38415bfb2c55e179a812f28191cbf9a6f9ca0eb --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ed36de1a611b4c19e112ccbe8a0675950e3312501ba1e8c0dc388b48d92abcc +size 208731351 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_7_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_7_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2f4bb8119075b15ebf68fbf04122788c274e5128 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_7_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f889dfde3b837039d224b235f87f162eb762281eb971e1353454dc8090827c0 +size 208732119 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_7_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_7_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..46c0a4add4866432bd023d8edcfb502c704e3d68 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_7_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c2d222acd175757778d3eecd578c0a1f24c1b7cc8fb2b8917e635e77d2973b56 +size 208732119 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..296277d134b290fc5e45489da6d196a48cc33f7f --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:07274c1492983778a56067d7a6eb8437765e98573c5c53d8a0a36328be44179b +size 208731490 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a632d5245a2058ec79e3fbd1a39f591d597075d5 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7e77ef15403481bb8ce9d5ae7ae82fb742d8c3a2d524ab97dcce3947cf50285 +size 208731490 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_80_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_80_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2a3f0ce712bf68b039dfad0890ce24c234dee226 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_80_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8815d0bd2faefc58a9a86e97566116a8e690e0d5a33da2f1a745d7f99191d9d +size 208732258 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_80_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_80_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b7378d2651014e597b6ca2d1c7b1f8371628f105 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_80_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6a887661d863a455ee48eb11facaade64096e680919bd9dea7debc2c68487d17 +size 208732258 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4eb98a5336ecd974bbdfbd61d493c4094580db13 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e35bd27e23e2b1f9ac2f69c2afe85bab13794263e8deda649673274aa6defe3 +size 208731362 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8467adef16e3835356e36cfed0fb072cef90d299 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:019a05f99c35d57a1e23a2c4a102875bf27b553f9ebd6a434ef5c9f049beb64d +size 208731362 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_81_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_81_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0907c9a91630a5df8508620bf8135a9fcdbacc22 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_81_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:63e1ec3031ab88242b0f952c63c7040cc387e8a5ddef6ffc40ab4c715b1d45bf +size 208732194 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_81_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_81_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e0901cbdacd46e099f89f728d029323331e9411a --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_81_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c2b53c97b5da27eb9359509854ae5ad3cb9b005c73d53ffd60660ceb9fb474c +size 208732194 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..499c82d1f2c148fb8a1084a48730960e8a01d7ed --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:79b9e1aaaf4fc31d3cd33f538105196fe2850c8e35e9a8af6d5d7fbcd990ae10 +size 208731490 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f518f3ed10125cabb82ccf7324cc22ef61476c47 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f12693600b62a759c53d70277a0143884748f645a84fd630c5a9724ef87758c2 +size 208731490 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_82_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_82_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5f21b3d2653ec79cf485916c84a970f9f887da6b --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_82_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d4fa187db9c25baa3cfe6ab657ce22c37a2229269d931bcf0aad83ca3af80c7 +size 208732194 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_82_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_82_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..026bf422f15335a2f2f5ae96b0e42491d2508bba --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_82_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eae98d0981092e585669f11580df0ccb2604ada82fe54c98f09a7d5e473cba46 +size 208732194 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..292e4cc8b554721a0113b75e5df64f3a017afd29 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c459aa0f2ab3e32b0f4862b773d18d8f6a7f02aa406898539cace55c2d0d10a +size 208731490 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..05abffd22ad7aae12edb9550d17b192184424161 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eecf836ceb61c87239ac6b045463825af19bce4464e7c631c5aad2526873899d +size 208731490 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_83_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_83_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4c8c3a00bce13a754214131c18d6413413358b1e --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_83_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6a2c3bf759c540da21fb82484163a82bf4d265aa73282e607168674aee26cf74 +size 208732258 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_83_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_83_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2ea1582f3b659884adba348d5518a799c76f6402 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_83_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5654d402bec30befa87b94329d09cb0534daa0c7b35b45520899c218b93b0587 +size 208732258 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..08f53c0f346ff315f7fcf601a33689f939717823 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a075edef7965cfa92268bccc0e7e9fa62050231048667b356aa115ea22644a61 +size 208731362 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7f362a989912c5d50746ff3b32f35a657b2db413 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b3cf1d4703876a519f95b5c6a7032b41799743b94402cd9618f4c4959c2f7989 +size 208731362 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_84_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_84_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b10b9348fe7c7e1401c0ca5dcb621dfbc61ebade --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_84_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:686becdd0aae8f297630d40a6b90b7e85be699d2501261ba8ebef94561d0b7ef +size 208732130 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_84_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_84_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e4b3111e8b9e62e2d6640fcdcc3c77f0d5f029c9 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_84_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc554d801d45d9f2fd08c8a57888d9d28a97e2e44ccd03a4eee1dc5c3a900cb8 +size 208732130 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fc2bc87d4a9468645aa5cad82a3f81e5d2745ae0 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90cbb5951bfbd0e89635e48fa220ab1b524bec6578dc4715583c8b55e68f44eb +size 208731362 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e3de2967ac81fafe5040a95323d373f08efa4831 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e75fbcecfac5539b666a0df4ea5349d613dc8ef776a395e4d03754957bcd15e +size 208731362 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_85_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_85_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e3885e3170a6a43e5862db42f91e2f7990eba4f6 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_85_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:44da3c18db1a92bc848d1dd50a4282e8485c6f9be052ec1aef8cb2e7bb69bea9 +size 208732130 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_85_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_85_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4d50eabda83572017e0f9745d1c471dbff7415d8 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_85_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4bfe965db1531f1aec433f063c10cf001be620eba97fdfe8ae6f06d4f5af1376 +size 208732130 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a8707aa43136378f404d6f1bb05c44057c9add84 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e49454b310020908e8b440abc8f1983c4cb82dd0206b2ea9edf08e3ce4791467 +size 208731362 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..21560fef0caa05488d88d44532d425e0d3d50079 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d73d8962e73ae250537a0eb403ecae636410e44b62ced8364f1eec4f02d80ae +size 208731362 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_86_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_86_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fa16ec5250d701d1c9124710ca4d1e03425f69dc --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_86_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0cb0595dba0f5eada834d1a893169be56302ea5293e422c3ffb2a686df7dd6ae +size 208732130 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_86_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_86_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cb359ff27f72acb7fefed99e716412044ee0429a --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_86_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d9fc45a611630d15b1a5a07618798e31afeb57e2bea8011196e0b8336fa8599 +size 208732130 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9f0ac0f9e962fe7fba1c02f319d31a3bc052dd31 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9936cc17d174672a124eea16f7d6eeb61dd8d974dd72c103ec97797fada8cbb9 +size 208731426 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e02bac07284f548db13ff6050c8421c71ed9ba35 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5010379c76a73105fe266307bcd9a117d92d42c8351503a1def5ced2dc4694f2 +size 208731426 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_87_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_87_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..18d243c9cfc2cec62b78c637ea72a7d2c2b48157 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_87_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff5021f8d7c9c6afda82e145a448549e04736fca4f7eb0b998bf4baf91e10c92 +size 208732258 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_87_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_87_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..105e45edf9877058e390d3707721626de1d9103d --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_87_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f3eefc00057621d4fb339bd474b886faf6e96256c7eeab0ac19dd98bdfaeecd +size 208732258 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..846753f7210e505af18d2bac9383c33920216c69 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9e108d467b3caa82fe473f741471b919791703753e9e569015cf2ae8da14e57 +size 208731490 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0683fef9b1bb34d1a15696bad17e76d3add28b4c --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:54d22a59d2cf6ae8627ed48fa96124ce47fe962b21b551acaba78fa8784049a9 +size 208731490 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_88_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_88_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..efbc2a67432d480b170202681b105cc2e67dfc1c --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_88_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:49c164c28f34598d4bfb80032d81c32c708a57828711097292fff124ec01fd78 +size 208732194 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_88_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_88_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..43d1525024865be63148d727644bb855aaedf4b7 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_88_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b56cdb30ebdf7eafd5206e8de8088471d0cf9584f25a39d0588465063573038e +size 208732194 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5b9fa3b8899193805def438ac251dfb82db8b194 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20955f448e6b49ef33d2d7ce6ec894f2eeb314691b23b151bd8c0a4ec2d9e682 +size 208731362 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e09bb76129bc40072f9a1a888270ac58feeeeb36 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:98937a32c049edfca19ff863fdee4546aabd1ad9b02d7fc78f5f3a2ae574a9b9 +size 208731362 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_89_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_89_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..12b2d5fa28aabd4c9e88fd125fd369d2c824f98a --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_89_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77a90dab3443278091cd3f48eb1bf4b1056eecd52af10c3bbbda05fdfac6e509 +size 208732066 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_89_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_89_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..97d9a1f8973e23831fdb583515b39ee0f14517fb --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_89_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e0efb9c7e71c7692826babb048c984e5b76e514c7166ca21be76a3ea696ffe3 +size 208732066 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..63dabaf0691bc78532c27ca25fd15b50d07e6e47 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e276f766010dbe606a9b7eef9ab618b4a917e57eb108b3f885b90c0105ff975 +size 208731479 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c1655b41072dfc8afe1ed537492d3185464ad72d --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c34fa58841b6b0ced8c4dd42d1d5f4f132000001a2525c1dd36223d334c0412 +size 208731479 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_8_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_8_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2149d54e7460710e13cce0818c2609d420c39173 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_8_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b5f7e0591ab613281118c6409a71f92a415cfc733a262255dd98a1aa1d87cd10 +size 208732247 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_8_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_8_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b95d8ac91a26456d85a85af9fb7f16ce5dd42ec4 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_8_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:79055fb9f2ae9602fd32be738cf8cf0e8a699e63d1d7bcaab6a9721cffebe8ed +size 208732247 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cca20df4838af393e49320d669be25bd5171f2d4 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f400ab53a6808f23014dae4abf2b73aef1961778a1eb60a49740832e3a73b07d +size 208731298 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0e7f5f010df8d4232b7a4bf8d2182289a6e79ba8 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6799e83fe5bf64b1220875ebfe599c9497fbeec20ab5e1eb2955183bc21caba5 +size 208731298 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_90_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_90_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f0e827c98d82e6bf02a6cd2caa7935e73af1530a --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_90_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8cbe0ac226e3f86044a7eea0a4035f662905272b6ed10b80971acb732f114df1 +size 208732066 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_90_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_90_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ae96b0c5849ac6153d924eb90c6ef08fe80a9c53 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_90_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:888f28be5f1eb6fd9f9ce407fee47bec086222220b846d505c6ed16940157765 +size 208732066 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c8a517d71bdbe58cbc73c201d55a54b919199743 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c106bde3c1ceb29bd48e29dc3896d12f838d61660cf76cece0ed4bddce658b60 +size 208731426 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..af37b2caea55b2b3bd6acbeef73648d90271e8ca --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca0d24080cc01079b72c8253b596cdf96a8226f67c78c02d8d7c303c659ac4f7 +size 208731426 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_91_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_91_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..57080b4992aa8f488d6eca69f700345962613c89 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_91_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b7d77bb5a30372c2792c164d103bcd1077d19b7f0f06b8b5798bc51a9a02b7e0 +size 208732258 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_91_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_91_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1d02129bcdd2dcc52a49d98902c3af6227ff7a3e --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_91_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee5a58281f5d8252b461eeb594464a30a7c6f02f2384419377003580b0781537 +size 208732258 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4078cefecafc2332dbf241623bd07ad1802fde09 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:447e4b8032b1c0db1c18eae355fa00eb2525939d21f47c3bab66afd0403a6381 +size 208731490 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0cfee982a854fb1095f9acbe8abf3700e03a79ad --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e765cba0ef2ec2d23784186d71c8100f2f80a64b03c317c32b31453739bf49b5 +size 208731490 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_92_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_92_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..893ad48163af1c2b5946cf10f954fc5af9b000bb --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_92_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:09b1f8b5e9d1a954e93d7e2243420fafdd8caf202e2c5050c16313d0d3df6720 +size 208732194 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_92_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_92_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7f78528636ab9f9c806ce99d8869821c436c1cdf --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_92_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b1058ea3a53ee88479d7a3d59ef3e69f8dc36d2f4d6b474f206de28435acb26f +size 208732194 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..08569e84d96f585b602a3c7646d8f9870949bfc1 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a17e20070bd977ae8d048db6f719e6cd9d574bc6ee056ecb8a534859397285c5 +size 208731362 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c3bc17c533c97fec38e21fbc31febc68ba923ec2 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b39a2e1571412fae5b3a0582f51fc0b02533c8273736796ed09e6910c3ba14b6 +size 208731362 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_93_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_93_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cd0df358c3830cab93ddd14b317db0e9bdd7d695 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_93_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c5010a2eb34790587c8af0edfc486beeceb704f6ec24bdeacf5048b334486438 +size 208732130 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_93_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_93_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6506a0363e61981e96b161ae14e165f686154d27 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_93_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:628c695d1f4223ffec82dd2472f1e8444f5ac8420233be843022f2cce3abb47b +size 208732130 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f3ea788fba64008be7a0474509b91172b5852ab3 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5575b17b966fea77c36783d2645e8c4bb023c0c6a4f92994b93d75cad6ec48ad +size 208731490 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ce3e484c293a6946b48244b65def21cb9eeab8eb --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:428f458ced1e759605e629200e2d54d87ef366e9a5c6ec1d59c9c55c51aba738 +size 208731490 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_94_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_94_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..48295f80b188235ba94441f3f6641a9c82a6cd14 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_94_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:152284a6c4b3902b132909b8102099dc08c8a4e38e1509dafbee4b715d6ceb9f +size 208732258 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_94_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_94_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fb5d7b6e630577efa618771b3b835e5d779463d0 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_94_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba7a2a8fcf02ea97985e99d9730746863a092cd078b96ee2a2d631aab65fb4e8 +size 208732258 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..008eefb5e440405dec4a92da91625a5162afbb94 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4275a622b08b0cc8b13a5a20b1c0bfd9f522f42e2a2bc4da87c54f6a6ead7f41 +size 208731490 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f7cfbf61baf2418fb878702e6ccb0699061a8674 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c74e933f13991473ca3ecfb5207085e254ffb4d6bbad0500885a6e3cdc1232cd +size 208731490 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_95_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_95_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..be6701cfc05638f9b8fc60113e1ad4226b1f3c36 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_95_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51170db4669aaecd7a59cab2426f395bf6bae60cfdccd74a2782af1726f18aa3 +size 208732258 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_95_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_95_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4b832611be3d85c89991aa97a8544342aae5036b --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_95_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:238d7a5e128983bf5f19f02229b917484169dbb4e5dbf029ae4113d822240cb0 +size 208732258 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d5bea15b451464dc854dd259beeb6156d799e097 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ae4038cf14207023ac2f75dad79ebbf2e5fdc4dc5fda0ed247feb7a7bdae8cd +size 208731362 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3e0fa3ff50b705169f5ab981995b2d8c78cdfe5c --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7d9321bfdf0d9df215db6ab1eb2b8aa89a2b14f53195af26ad37f8b53517f1f +size 208731362 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_96_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_96_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b75d45a86b56770ebcc2da95c4e9288ba6c7a7d3 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_96_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97967173fb5a90d8fd7673450077849df0534974208bb3ee35faac40a302844f +size 208732130 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_96_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_96_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5002939874da6f728c83c0b090ce253f4d1639ba --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_96_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3fff536bb1706983e72226877f295e6ba03a3dda47811633f1e2240ca8116ee1 +size 208732130 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3503fa199231d3acda7e5ce516ecad852354d52e --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:56f90c846efe90882eff8d0e6f170af84b46d32d51084b2a1c60e0150e801766 +size 208731298 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8d3543258141af019f72c698f48aacc1a75625d2 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b551388efbfd38603fccea85e151b2c121ca2a4b249c2fb339600830159c152 +size 208731298 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_97_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_97_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c96b3fef3789b6cce5994961dbe6a7fdf04a3eea --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_97_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:971b4ab1d6c1c5cb1583d044d1aeba14e0fae570dbc6b777a114de7d9e69bdee +size 208732130 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_97_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_97_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e303f1b0c419c0d2579f5a5f1627967c7671780d --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_97_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad7af8c43be187fee25e57a7ba5b24a2bb4dcf69e1f1d9d9940bba8440ef9a28 +size 208732130 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9a72f1db23422297de4a23757a044307bedd517f --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e8fa66624fb44ebf4f186d5af39cb05cb74b8c274a31ff624294bb9ea6a4d29 +size 208731426 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..30b47d5132ae15c625d86da372ca026177e0b962 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b34ab9db6764ad8f08cda094db804d9f838d92ebbd7d01d7a9d25dff76074054 +size 208731426 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_98_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_98_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5e72df2290d34273a315c207b862b4939f18d06d --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_98_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:52152d8b573c1a915577f2a7955046988bb04c370a3b7294431253a0b571e062 +size 208732194 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_98_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_98_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4ccc373a64a0eeda2e5c9dc0317d9b1fcdb9423b --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_98_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab80a7ff571d1cd28101c24dd99094f5eaee067fc453205975ccbdec6532f77c +size 208732194 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5ea4215029fac81522c446a9f1831490b6d00b5d --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b05bdede7b8c4aafa45d4c987c3cca1b8f0c11bfc168692591a135a8ccf0d2ff +size 208731362 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ddd6c9079871880b73c6d2666267c86dacfea3ee --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:83f062f55c5a577d5d35f43ff2a7a6c08d17af02259d071767a41446ec734270 +size 208731362 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_99_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_99_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a1201dbaa24147f17b55cb6203959050e62eb04e --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_99_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:353b31bcf6061393e469c2f496d5aec853617045b53e7c7263cfb1a453477cc7 +size 208732130 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_99_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_99_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..50dce547310b03ec56ad2e1afa3440833bfa9fa2 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_99_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d5c18ac883b82efbb86f844914de8bcf06156264112b9472409f1db3e3e5df6 +size 208732130 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d87ae049cd354d71cbe4dbb03edb06eab15c60ac --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fde9df79aac26ae9a2109738801b30ae28c6ca04b5feceeb5393729d6c51b5e0 +size 208731351 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..af4610e40fc92889edc5ff7fd26d575941fb72f1 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:251d28ea3dc44981c0db29cf803763e7ef4c0a2ca0f6742d0525ef31e37d13b1 +size 208731351 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_9_mp_rank_02_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_9_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ab1721ae25f2f26b3416e13f4557c59991746b91 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_9_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cce1966e6b2d565bd23969bbef01ce111380606b5a8aaa70c249c94249418ea8 +size 208732119 diff --git a/8b7178b44b/global_step84877/bf16_zero_pp_rank_9_mp_rank_03_optim_states.pt b/8b7178b44b/global_step84877/bf16_zero_pp_rank_9_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..34e46d17dc1e46f4e3a40f2f10cc4c205ae3dec6 --- /dev/null +++ b/8b7178b44b/global_step84877/bf16_zero_pp_rank_9_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:41f0013d48688ad9241f4d4e4a6e7444e3af56a9465219c65307ea91c8f3fd50 +size 208732119 diff --git a/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt b/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e8cecfc2dcd8fe66e587031d5216495c640aa8ac --- /dev/null +++ b/8b7178b44b/global_step84877/layer_01-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74601c7d9be79d3dfaa452f5a2baadbc92c54f74aa49881186ccdf88dda63374 +size 223347971 diff --git a/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt b/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..73bbadf3dab2540ca078dcfbdc6d61269ba19070 --- /dev/null +++ b/8b7178b44b/global_step84877/layer_01-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df12cc00fafa1b58a4f213214df68cc38e149364cedee343bec2aa4a4fd6b863 +size 223347971 diff --git a/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt b/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cbfb76419faeea0facfb5dd8943156a705511cba --- /dev/null +++ b/8b7178b44b/global_step84877/layer_03-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d820e6297236792b5328276c0b81d8cfaf17271a89ca79ca274a977d98cd0187 +size 201408771 diff --git a/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt b/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ba8aacafa70adc132bc8eaf31211bda937d84ae8 --- /dev/null +++ b/8b7178b44b/global_step84877/layer_03-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a7d7679c9f4e791afd6dcafcf8788d78d06f6bf26e74563f198d1796ec717b9 +size 201408771 diff --git a/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt b/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a06586fa9f94937563b3a5d5ac99168254507f4c --- /dev/null +++ b/8b7178b44b/global_step84877/layer_04-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7ef13d248826519ee840b9cc8569a1d77c81a2425276435795d7985ed5b4808 +size 201408771 diff --git a/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt b/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e3cfd094e27e7b8f5ffaf51ca4a1131c7363e8cb --- /dev/null +++ b/8b7178b44b/global_step84877/layer_04-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:45187ecede335d4ff92b449077710052cbfcdbd5bc4c9497cb119e80beb1a709 +size 201408771 diff --git a/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt b/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fb737b344fcf5cc5b5c44f287f75061cb2be2883 --- /dev/null +++ b/8b7178b44b/global_step84877/layer_05-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:539937ac2c5615938dacd35317c15c0db30d47057f0c9178b5f171675b975117 +size 201408771 diff --git a/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt b/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..afce3bd0db6f2c09d694c0d244679adbd5294aba --- /dev/null +++ b/8b7178b44b/global_step84877/layer_05-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec788af6bf6f99734bb866e90f5a690d089b71c8269aea202bb0e281382967a9 +size 201408771 diff --git a/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt b/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3702e70cf0e51cd996b5e5df75b3ea8353ac639f --- /dev/null +++ b/8b7178b44b/global_step84877/layer_06-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ba2ec11f12e223167c31d056e036b67cedce0772d7c912a00985eb0c69edb7d +size 201408771 diff --git a/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt b/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d7a0177e3263cf6668e6ca171fc9ca5a6f096c78 --- /dev/null +++ b/8b7178b44b/global_step84877/layer_06-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:11344bd43443099d4483ef06cb18d2b210b6751c22906836df8d257e746d0417 +size 201408771 diff --git a/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt b/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..81a23bcd227dde302275e131057c4924b8ded200 --- /dev/null +++ b/8b7178b44b/global_step84877/layer_07-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:01ae2ea9d73ea674b25ee889402cac92ebce30880a5135c57a6629c509d7937e +size 201408771 diff --git a/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt b/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4e648d80cafabd10c9b2aa98c23a8394c2a92147 --- /dev/null +++ b/8b7178b44b/global_step84877/layer_07-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:303d252e8ff0c7a1c309c6a535cde89a3f35e7b9994a5a9fea8336160df02acd +size 201408771 diff --git a/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt b/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..75e4a814ff07cd0bc4d142a71f4d47b5b17980c6 --- /dev/null +++ b/8b7178b44b/global_step84877/layer_08-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd5c99176f9fd4236f4a80a3e525a8731783681526004855869ad258ddda41ee +size 201408771 diff --git a/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt b/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5caec18bc538885e6ba93f81cc15adcec6f68561 --- /dev/null +++ b/8b7178b44b/global_step84877/layer_08-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e76e87fce7669bde24d7b8d6bc3b283b21db3462ed3678c2ba0b2b029f4288d6 +size 201408771 diff --git a/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt b/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d7fe34886c8ccb7640767b4f64c2f0286ec46327 --- /dev/null +++ b/8b7178b44b/global_step84877/layer_09-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c59c51ff3d93aa232e7182cc017aca5feb995a93ac3442403cd7ce538ee98fec +size 201408771 diff --git a/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt b/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3ddd0a2d85fb38fcb53f34c754c744b73ec1abf7 --- /dev/null +++ b/8b7178b44b/global_step84877/layer_09-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f01ec54ecf634d3c6c0008de529e48cf997f727ef4ce44d062850209b8100c27 +size 201408771 diff --git a/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt b/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bdd3be07ad4e22e0be635360fc9ce95d54e191d7 --- /dev/null +++ b/8b7178b44b/global_step84877/layer_10-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e081690b7e87983c17f863ce9177bdd9382b50a24dffe4bcdfa2f6a3bf05c04a +size 201408771 diff --git a/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt b/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..494787efada381e21c062e334b38106fc2fa054e --- /dev/null +++ b/8b7178b44b/global_step84877/layer_10-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:995f236d22f77f6979e3ae55108cb3878b472856fc85e894faaf797d03ef0b47 +size 201408771 diff --git a/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt b/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ef4f7f7e1f590ec146ac26a3b00ac30590f8593e --- /dev/null +++ b/8b7178b44b/global_step84877/layer_11-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9460dafa29976e80c077038e18614bcfa73c8f8cb45993589c862e398fc225ca +size 201408771 diff --git a/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt b/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..80cfc32afdc93c6923ef056462835002505d9123 --- /dev/null +++ b/8b7178b44b/global_step84877/layer_11-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f5bf2a6bf1fb4ea0d8cf663c23bbc4af3f8f62dfec09a9a2e946c63746b610d6 +size 201408771 diff --git a/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt b/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a498feb5fbd0f95b6c0a7ad9187899ddc73af233 --- /dev/null +++ b/8b7178b44b/global_step84877/layer_12-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a16766cf65b8ca0e42d4e530c795997b84aaba58fd3052b73a894e3a2abff954 +size 201408771 diff --git a/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt b/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d56de9dea8091ca544d42d4db24d631518b28750 --- /dev/null +++ b/8b7178b44b/global_step84877/layer_12-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eaaad63eaca04e70e8158016f06c7048ffb9109fe08a3e0db734a13bb8b4ddd5 +size 201408771 diff --git a/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt b/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..800014047efde2cd918cf535d65aa9abaedd2c6c --- /dev/null +++ b/8b7178b44b/global_step84877/layer_13-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ec34389d7319c43930e41855fe9682d063fcfc97b7807bf96bb3c97a0c134e3 +size 201408771 diff --git a/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt b/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9d021183d34ee0e2c0d647e3cc7c6391b6832833 --- /dev/null +++ b/8b7178b44b/global_step84877/layer_13-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:deb20f37c7a9624fa0c83537979bc8c4ab0bd471d0d0ed78e3556094b43ab7f8 +size 201408771 diff --git a/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt b/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..aef13765a0d0ae9db31e1008d106884c096a8248 --- /dev/null +++ b/8b7178b44b/global_step84877/layer_14-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:330d29cf71b9a7855a6c52ed9aa38d10fce6c462dafce4c83929dfa5ddd1bc73 +size 201408771 diff --git a/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt b/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..530967cc67322f2b9fa766b7e9647210757658f1 --- /dev/null +++ b/8b7178b44b/global_step84877/layer_14-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ace25ca84edb81c2017b5004460b1cda9c447f599aab8da41e5bbf9e76ba6d6 +size 201408771 diff --git a/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt b/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ef0028895697b6c9ee6bc4d29fc7171e04fa11b9 --- /dev/null +++ b/8b7178b44b/global_step84877/layer_15-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:56830c60b5c9dcc506bf92b5d74aaddacf65163a1ecb934e5786dca6e988465e +size 201408771 diff --git a/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt b/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0532fa6a04799e02cead13ded25b8eebdadbc5d2 --- /dev/null +++ b/8b7178b44b/global_step84877/layer_15-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ebcfd936bc76fe69aaba1a59d3b7b108c9c2b426f724ab6867d1a49104b7ab79 +size 201408771 diff --git a/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt b/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4f332fc98403ce1136a0092787d3597fc11dcaa7 --- /dev/null +++ b/8b7178b44b/global_step84877/layer_16-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e1d76ccad99890e0367f132f51dcaef072708b11840a51cc42623224550e7d33 +size 201408771 diff --git a/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt b/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b77986d94a265286c234d5b899c1325db1a5cd2b --- /dev/null +++ b/8b7178b44b/global_step84877/layer_16-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:873b1c1c9acea5bc1695ed18141b7da45b3812ade2e8401b3871923c857476ce +size 201408771 diff --git a/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt b/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c2420bd8ea9e29ed9511851ded9345202db19f28 --- /dev/null +++ b/8b7178b44b/global_step84877/layer_17-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab9f511f28040b3bc68ea9c253bf52d1ed2bf1f73a3623dc38cb7046865ff946 +size 201408771 diff --git a/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt b/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cb4b2e390a537895624d85dc04cf5cfe9fe1538c --- /dev/null +++ b/8b7178b44b/global_step84877/layer_17-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:19eb375298c50e58a7a288417b0f120ebc224f8873f1548a603a32867318e3fc +size 201408771 diff --git a/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt b/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..053b94abab703484405ac06735f39e62f9b76404 --- /dev/null +++ b/8b7178b44b/global_step84877/layer_18-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f4f78dd9c72fe1507364f899814637e5c952dbaf1ae6de48dec992d4394aab3 +size 201408771 diff --git a/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt b/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6ff6b720abd94d516f4e51ea4ba65da872eb3ee0 --- /dev/null +++ b/8b7178b44b/global_step84877/layer_18-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab0b35ef900be04cee57811269afab219881e8de91d602bd305f7de61293f995 +size 201408771 diff --git a/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt b/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e3b66aa121b727b316791adf324831950369e02a --- /dev/null +++ b/8b7178b44b/global_step84877/layer_19-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e8b6044b937a0543c38a3414b345c7b68629a569d6b75446cef163ab69ad9ea +size 201408771 diff --git a/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt b/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f2c8f98c7536b756325b6ed4354ef2b3410a9e81 --- /dev/null +++ b/8b7178b44b/global_step84877/layer_19-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:216d2903c4c6036931d34d132b30bfb9ba4468604e6234716ec943a7b5e1f583 +size 201408771 diff --git a/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt b/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..725b8e7255aba56eac3cdacc8b890f04248f265d --- /dev/null +++ b/8b7178b44b/global_step84877/layer_20-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c4cf1ef988ada41a2de01be276c8f4183e26cf4ba66bb2fa2b0fff06c0f7e20 +size 201408771 diff --git a/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt b/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4c3a8714da348bf2df39042745e7549285e94b11 --- /dev/null +++ b/8b7178b44b/global_step84877/layer_20-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8eb0ece70bc54616f9c4b943bd0fe702d01eeafcf569a0539da0929ad3306b7 +size 201408771 diff --git a/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt b/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..57e0f98c4ea4bc9fc3871133d88af721c6a0e75b --- /dev/null +++ b/8b7178b44b/global_step84877/layer_21-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f458c66cb302f035ff0a38154e63a0be7e7304da8da90f2a82bfa7a898f3d2d6 +size 201408771 diff --git a/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt b/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..58e9206d4e6d2c47547db573c1f22ddb29e12a9c --- /dev/null +++ b/8b7178b44b/global_step84877/layer_21-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:662eaf8138a412599f6ebe94fcbb5809e5ebe232a8026d84c902d6beea50c402 +size 201408771 diff --git a/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt b/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2084644c9dae105aed862fae80b69c2f4c1727fe --- /dev/null +++ b/8b7178b44b/global_step84877/layer_22-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:85403dcc462f0b227b976dc9cce1b4e77645a1e47b50108639b3e755a57379eb +size 201408771 diff --git a/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt b/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6bf420d67e22f7f2f539e9699c2ce80e8b765e2b --- /dev/null +++ b/8b7178b44b/global_step84877/layer_22-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7380785204322b64f37c801e52da5be05a168dc89d1e4392fd9625cc3110e9ad +size 201408771 diff --git a/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt b/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4f9ae839a571c716b1671c5aafd67cacc52505cc --- /dev/null +++ b/8b7178b44b/global_step84877/layer_23-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af8db27062080f807e2a7130a705fee986afa7d8f6927b1f155b14a57ccb54be +size 201408771 diff --git a/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt b/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..aaa9d2babe3f25d73fc9342a4e544c9cf648f841 --- /dev/null +++ b/8b7178b44b/global_step84877/layer_23-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6fae800ca198100537316bdf8a3c46802aa303cb4496f68e28021edb1fc41bc7 +size 201408771 diff --git a/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt b/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8cd8997ea8c1656b5489c2e7e750af82f83dc374 --- /dev/null +++ b/8b7178b44b/global_step84877/layer_24-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:755c65e168b73e50aed3ae47febefcf1cc3411b66d2ce1b5577952fd5487979f +size 201408771 diff --git a/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt b/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1f49bb29f905285889d14c44763a570ad74fc1a9 --- /dev/null +++ b/8b7178b44b/global_step84877/layer_24-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:343075d2c094460855324e6d1fa439e3630e3e07e0267fe9143e17ede4542fd3 +size 201408771 diff --git a/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt b/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ed97e94ed8ea08d4067eb626501dfc3c5a42baad --- /dev/null +++ b/8b7178b44b/global_step84877/layer_25-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64ac8a85e37b6a829d1fb6df20e6b7f82916498bae085dbcbd49dc4af5d9a7a9 +size 201408771 diff --git a/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt b/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c88a7f05dcf7221259bb4831391f556d3fe44894 --- /dev/null +++ b/8b7178b44b/global_step84877/layer_25-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c31bb410a8e31bcd969bc4378aa77e3476c43331832042f2720c284ab64448a +size 201408771 diff --git a/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt b/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..feeee1411db56b270de305aa62360b98f7a035d6 --- /dev/null +++ b/8b7178b44b/global_step84877/layer_26-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:acaabfc54b060b4558d75e464cedca98f5869f77f1474341c888d41611a132c7 +size 201408771 diff --git a/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt b/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3aa60c26dbe5b20ccc618fe34766206264f59a87 --- /dev/null +++ b/8b7178b44b/global_step84877/layer_26-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b16a23c4a75c89f4751b66ddc81ff2041176599628a5e7323a9d973d227727f +size 201408771 diff --git a/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt b/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c1258912550b46ab4cbc63c174cd50db955f3f6d --- /dev/null +++ b/8b7178b44b/global_step84877/layer_27-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:024a9d8d2bffef77e53c37d25edc54a50e79df67cb7479f1faafb203b31734a9 +size 201408771 diff --git a/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt b/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3aaa91f7dbb402ed5a5df242d716dcc124c663f2 --- /dev/null +++ b/8b7178b44b/global_step84877/layer_27-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c15ff20f6216b2facb3524384bb62bb6bd66dab4576a4f8ba4d39a2e6f1c14c6 +size 201408771 diff --git a/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt b/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..25cd097081408b1dcc878b1578d2e4f0c33e6a3b --- /dev/null +++ b/8b7178b44b/global_step84877/layer_28-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c8f11a9f20e9f66403f12f87d2862d228ed75dd69073da38247d16544866559 +size 201408771 diff --git a/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt b/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..390596b312596d1fdfe8cdea4f4d8a60e9aa18bf --- /dev/null +++ b/8b7178b44b/global_step84877/layer_28-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e57b91085d90f1367803d6272707719d78277d79b00e890ded6900e7c1f5fa3 +size 201408771 diff --git a/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt b/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ce58fd3b2c89daad5e13bd97e0e62afeab8de205 --- /dev/null +++ b/8b7178b44b/global_step84877/layer_29-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:50a047523c6473ef4ffeeb4868887d46b4d77d87e66366301e84759feb49954f +size 201408771 diff --git a/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt b/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1ccb447326ce80d557c8db6929f4861d1b077541 --- /dev/null +++ b/8b7178b44b/global_step84877/layer_29-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ef074de44861f04b0eeb6fbee86df49a4ef0870a311af458eef58706e35c29d +size 201408771 diff --git a/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt b/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5cd8f8f1f97efaf27a94ef8325345d94f6fabc23 --- /dev/null +++ b/8b7178b44b/global_step84877/layer_30-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:efad97cb8916006efd0b25ed3d79dc28f4461784ea498d566c09cf4292f87620 +size 201408771 diff --git a/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt b/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..78a762b9629c151a3606d9f04186aa250e08c5bf --- /dev/null +++ b/8b7178b44b/global_step84877/layer_30-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:371922ba0e2e4bc2a3b891a440d300520942e2db4b975ffe7ce8925a035f7e1f +size 201408771 diff --git a/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt b/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0a3b44cb587566462dbc55b54b7528b511ee8b4b --- /dev/null +++ b/8b7178b44b/global_step84877/layer_31-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:948533ba2e490036439f198923cc8933c7603764358325aa9869663c092ca686 +size 201408771 diff --git a/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt b/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..92a1b33b0a93a441672665420a693e85a2aef536 --- /dev/null +++ b/8b7178b44b/global_step84877/layer_31-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f82648ed6082d848cad2f41431730e332d52a25baf0d79a156a5f22c52d6bc1 +size 201408771 diff --git a/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt b/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c1e3a76e72b79aec2fea92871fb8f5accb33512b --- /dev/null +++ b/8b7178b44b/global_step84877/layer_32-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:24a998803c47bcf0da451c00283c9dc5f9f489a9d4335f80c0171059b525b520 +size 201408771 diff --git a/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt b/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c570ec355fc8a0d1939acee635d8fbdd847420c2 --- /dev/null +++ b/8b7178b44b/global_step84877/layer_32-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:05dbdae9e0af26fba260ca67b61454b439774a47c26be8737aa45afeee722188 +size 201408771 diff --git a/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt b/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3f6de9e893dbbc40a18a007a9da888f71bc50f01 --- /dev/null +++ b/8b7178b44b/global_step84877/layer_33-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae06339abf7088313b8bb5a90960525f98db4a797ac98889862c02550a1028bb +size 201408771 diff --git a/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt b/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6e6d7300dec7f4bfb28932a2a41de3497b32fcbc --- /dev/null +++ b/8b7178b44b/global_step84877/layer_33-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:884d35115f320352670b1ba20f880d56244e0c951ce31980f13d4b999bc9371a +size 201408771 diff --git a/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt b/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e851acbff81ee923fb737ab66845a1a15360a5d1 --- /dev/null +++ b/8b7178b44b/global_step84877/layer_34-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:077e60e5910364baecdf284b73d1a719372af515d61fc4265e7a8d2e09ca6e52 +size 201408771 diff --git a/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt b/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7daf9e5d597f9ec8644cce954d89b62b98c12a72 --- /dev/null +++ b/8b7178b44b/global_step84877/layer_34-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:607ca15c68c2e2c11629a30abf337e980aa09181092ef9b933e9af4445773e3b +size 201408771 diff --git a/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt b/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9a61f29981ef1f664564c3edeb0a9415fcef69ef --- /dev/null +++ b/8b7178b44b/global_step84877/layer_35-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:069371c989f2d6908c31af146223dd324e5b883940b6912b5eddbe7c4698c528 +size 201408771 diff --git a/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt b/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5506cf1b3c3d13d3d2ce0294cb9bb3ae629127b0 --- /dev/null +++ b/8b7178b44b/global_step84877/layer_35-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3bd64fe73b4e59531a9e0c43e3b360fff5f6a9c64261cac1afdcdfdfb4da1198 +size 201408771 diff --git a/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt b/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..32f17c38c4fe2083ce05cafee4817b7361f35e37 --- /dev/null +++ b/8b7178b44b/global_step84877/layer_36-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e82c78bd7acab803f578d33c1642cbfc739c4c27215fa9da82e7880d42279794 +size 201408771 diff --git a/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt b/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c244019379d87a7a2042385953a13cdc26c900ab --- /dev/null +++ b/8b7178b44b/global_step84877/layer_36-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:faf6197f062fcc76875bc3e9d7c90538175174112d75b22828a67cb968954de2 +size 201408771 diff --git a/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt b/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7d348b8e1bba8f5bb9e4eb43cce43d63951d28e7 --- /dev/null +++ b/8b7178b44b/global_step84877/layer_37-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af9c1b6581b53288823a7507be0041a7699b4a9cb83b6181077771c180dff1ed +size 201408771 diff --git a/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt b/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fe5636352eb1cb5a6a6cd0c390a3e233f5f7758c --- /dev/null +++ b/8b7178b44b/global_step84877/layer_37-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e856962b83db6fb61473fa35cd18049b0155cb0548e38158cee5ad56f6355908 +size 201408771 diff --git a/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt b/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fe172059c819eff0dffb21ad010f420a5f6afa0b --- /dev/null +++ b/8b7178b44b/global_step84877/layer_38-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ecd82c93c2e1c12a1e16ae9eaa0599079be56e650d8b37282652910ebabb39ca +size 201408771 diff --git a/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt b/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b4ddf8d0ba9bf06ece35bcf839a0880d42da1f55 --- /dev/null +++ b/8b7178b44b/global_step84877/layer_38-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:32366d6f6d50d0b26544b01b55b607b12d9644447960da6c51867dcb69df0810 +size 201408771 diff --git a/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt b/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4af27ec7101c9030c6f14667020d691e80f0bc01 --- /dev/null +++ b/8b7178b44b/global_step84877/layer_39-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:21e0f55d1bdc5e05f981ba48bcbf32e4456874e575f6ac2894505a16a9282907 +size 201408771 diff --git a/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt b/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a63f3fdb1022369cbe3cf194d30a4455f4ad97e0 --- /dev/null +++ b/8b7178b44b/global_step84877/layer_39-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba86d7b7e0960a04157acaf3c356c8f4c83003d9602046d60baf164bb46fc6fb +size 201408771 diff --git a/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt b/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4d762be80946b9e407184c8bf719b19b642f5456 --- /dev/null +++ b/8b7178b44b/global_step84877/layer_40-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb6c609450f26b02e2553293b073da5379dd108fe943acff0806d4a711b8b2bd +size 201408771 diff --git a/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt b/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..be0b90674db982872376a827825be0290ab3de78 --- /dev/null +++ b/8b7178b44b/global_step84877/layer_40-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f8bc470a162c0c0c115f2b2bb0e2aa11e0f218637b1ecccb063aba27a0a916b +size 201408771 diff --git a/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt b/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..94163cfb35a1ab564c4803e3d86afd4474532017 --- /dev/null +++ b/8b7178b44b/global_step84877/layer_41-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:89f5fb8d562ae7fb747c879accfabe20950145f35497043763d22e1f81962ec5 +size 201408771 diff --git a/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt b/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ddc98db95a91f69f4184283855d777d45faa1d77 --- /dev/null +++ b/8b7178b44b/global_step84877/layer_41-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae4450d682ba41b612eea1db73961358403d439b9e366a88b118cff006f34d1f +size 201408771 diff --git a/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt b/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0f17df8e51cc1eb87fe2deb4e09c4272529387e5 --- /dev/null +++ b/8b7178b44b/global_step84877/layer_42-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:747c658ab09278ab26404cb88431b9c664d7ea7a78e07b4d826edb4d1b799932 +size 201408771 diff --git a/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt b/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..64c07baf9fbb0087f6dde4d665482a6404cd0e37 --- /dev/null +++ b/8b7178b44b/global_step84877/layer_42-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8df0359137b1e6452d0b84f8324edc3fb019276561966e149701d7d08e347ca +size 201408771 diff --git a/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt b/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6462cd5c2c11920ff1782078c2344b0c6441c509 --- /dev/null +++ b/8b7178b44b/global_step84877/layer_43-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:edc70f898ef7a4da2dec6a160745da0bae0ddbeba9c52e46625b53358a0ca99b +size 201408771 diff --git a/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt b/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..eb190ff2c3a86785a9cff334c4f69f0ed6b12cb7 --- /dev/null +++ b/8b7178b44b/global_step84877/layer_43-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ad0c82e5f83a05013708b23c9382be1b609714302fc2af155c236cff3a172bd +size 201408771 diff --git a/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt b/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f2cd1ad3541e8172b7eb496b619dffbcac29a015 --- /dev/null +++ b/8b7178b44b/global_step84877/layer_44-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d8065163702fc7c38b132711da6099e42b296944755517cb37c24eea7ed02107 +size 201408771 diff --git a/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt b/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d315f2b87353a5b9aee8d0f93da9688ec6c2eb7e --- /dev/null +++ b/8b7178b44b/global_step84877/layer_44-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af8da1d8e14836ef1c3c274cb33b90410145f4d527f1a9df3f2442b48f3cb0b8 +size 201408771 diff --git a/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt b/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..64633703869b8b89135bc49035539aa5fcc61943 --- /dev/null +++ b/8b7178b44b/global_step84877/layer_46-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a4ec42679103d4de50528e66527df0f2d825996cd731aec93d1dd26e0da33db3 +size 17603 diff --git a/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt b/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4694473c0c158f3239465c71e2904354644f2dae --- /dev/null +++ b/8b7178b44b/global_step84877/layer_46-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:13534d1ef189338678a2cf8dd23db72beb0f0770cd22cdeffd3315c90afa0c34 +size 17603 diff --git a/8b7178b44b/global_step84877/mp_rank_00_model_states.pt b/8b7178b44b/global_step84877/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..86830b6a8cd4cc1dae745e0a336cb4063ce72fb4 --- /dev/null +++ b/8b7178b44b/global_step84877/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e1346fafe98f773c201d386fa0e85cc2b1c14ef89f61e2c6b31e950327bab21 +size 40115 diff --git a/8b7178b44b/global_step84877/mp_rank_01_model_states.pt b/8b7178b44b/global_step84877/mp_rank_01_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d7ad82f0e7ee7198a6726d8d0ca5ca80bcbb381b --- /dev/null +++ b/8b7178b44b/global_step84877/mp_rank_01_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd8dedc82c86c0a61159442e8e9dec4a02a3daa874171c028f4497be15529d75 +size 40115 diff --git a/8b7178b44b/global_step84877/mp_rank_02_model_states.pt b/8b7178b44b/global_step84877/mp_rank_02_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ee7fb2826b9048f629a2f8a985cf633a7f72ba96 --- /dev/null +++ b/8b7178b44b/global_step84877/mp_rank_02_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7cabd4ec39eec7621d6b0cb99e14a19e745d749e2c4bb5dc78009df8865ec452 +size 40243 diff --git a/8b7178b44b/global_step84877/mp_rank_03_model_states.pt b/8b7178b44b/global_step84877/mp_rank_03_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f6d9e7fddeed6607b54ba8df1cf953333b249bd1 --- /dev/null +++ b/8b7178b44b/global_step84877/mp_rank_03_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:25fe617d2b7a771ea4399ad091336b7415bc7b220ce66d659946d010f272af5a +size 40243 diff --git a/8b7178b44b/transformers/config.json b/8b7178b44b/transformers/config.json new file mode 100644 index 0000000000000000000000000000000000000000..eadf3eb13cecae9db1c34cde4f4d373a9d0fe00f --- /dev/null +++ b/8b7178b44b/transformers/config.json @@ -0,0 +1 @@ +{"vocab_size": 50432, "n_positions": 2048, "n_embd": 4096, "n_layer": 42, "n_head": 32, "n_inner": 16384, "activation_function": "gelu", "resid_pdrop": 0.1, "embd_pdrop": 0.1, "attn_pdrop": 0.1, "layer_norm_epsilon": 1e-05, "initializer_range": 0.02, "summary_type": "cls_index", "summary_use_proj": true, "summary_activation": null, "summary_first_dropout": 0.1, "summary_proj_to_labels": true, "scale_attn_weights": true, "use_cache": true, "scale_attn_by_inverse_layer_idx": false, "reorder_and_upcast_attn": false, "bos_token_id": 50256, "eos_token_id": 50256, "return_dict": true, "output_hidden_states": false, "output_attentions": false, "torchscript": false, "torch_dtype": null, "use_bfloat16": false, "tf_legacy_loss": false, "pruned_heads": {}, "tie_word_embeddings": true, "is_encoder_decoder": false, "is_decoder": false, "cross_attention_hidden_size": null, "add_cross_attention": false, "tie_encoder_decoder": false, "max_length": 20, "min_length": 0, "do_sample": false, "early_stopping": false, "num_beams": 1, "num_beam_groups": 1, "diversity_penalty": 0.0, "temperature": 1.0, "top_k": 50, "top_p": 1.0, "typical_p": 1.0, "repetition_penalty": 1.0, "length_penalty": 1.0, "no_repeat_ngram_size": 0, "encoder_no_repeat_ngram_size": 0, "bad_words_ids": null, "num_return_sequences": 1, "chunk_size_feed_forward": 0, "output_scores": false, "return_dict_in_generate": false, "forced_bos_token_id": null, "forced_eos_token_id": null, "remove_invalid_values": false, "exponential_decay_length_penalty": null, "suppress_tokens": null, "begin_suppress_tokens": null, "architectures": ["GPT2LMHeadModel"], "finetuning_task": null, "id2label": {"0": "LABEL_0", "1": "LABEL_1"}, "label2id": {"LABEL_0": 0, "LABEL_1": 1}, "tokenizer_class": null, "prefix": null, "pad_token_id": null, "sep_token_id": null, "decoder_start_token_id": null, "task_specific_params": null, "problem_type": null, "_name_or_path": "", "transformers_version": "4.25.0.dev0", "n_ctx": 1024, "gradient_checkpointing": false, "model_type": "gpt2"} \ No newline at end of file diff --git a/8b7178b44b/transformers/pytorch_model.bin b/8b7178b44b/transformers/pytorch_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..f0e8a819d9ef86e2559da8a48d37b30a859673bf --- /dev/null +++ b/8b7178b44b/transformers/pytorch_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10887e0fea58113cd861209728d00113f3fccc5c9de9193053e6b4dbd128a54a +size 17698351197 diff --git a/8b7178b88b/evaluation/generation/agg.8b7178b88b_GEM-web_nlg_en_PALM_prompt_0.json b/8b7178b88b/evaluation/generation/agg.8b7178b88b_GEM-web_nlg_en_PALM_prompt_0.json new file mode 100644 index 0000000000000000000000000000000000000000..11cc337b7e0857cb3019b83cba2fa9617acea05e --- /dev/null +++ b/8b7178b88b/evaluation/generation/agg.8b7178b88b_GEM-web_nlg_en_PALM_prompt_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.3018678413532531, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.02844023781425127}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.07529613947856881, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.001982838396838402}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.3128650370000908, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0050801382033981305}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.10892691674779821, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0019071235551653418}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.03417694669369951, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.001313368572681446}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.14493621807358514, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0032191726931486194}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.049040742381146675, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0011519113898695909}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.07180450626627975, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.001883124040127771}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.30107392723259574, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004911398619361963}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.10396046493580034, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.001778756221046735}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.0720836832710309, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.001909971490636727}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.29709085493162957, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004719450806012623}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.10404327940071008, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.001820581250965178}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b88b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b88b/evaluation/generation/agg.8b7178b88b_GEM-web_nlg_en_PALM_prompt_1.json b/8b7178b88b/evaluation/generation/agg.8b7178b88b_GEM-web_nlg_en_PALM_prompt_1.json new file mode 100644 index 0000000000000000000000000000000000000000..233d280faa7d1a0c8969d8188f59b77fa87a9793 --- /dev/null +++ b/8b7178b88b/evaluation/generation/agg.8b7178b88b_GEM-web_nlg_en_PALM_prompt_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.5232740840707778, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.020854898797383486}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.14535656258632043, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.00467037788995567}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.32467105717536826, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004844586825107793}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.1654988415912321, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.003746858529251122}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.07725516531902364, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0033727094011323654}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.16618004223187002, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.003573100663317745}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.08445836822356238, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0026512482133539865}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.1318447100821655, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.004146806578291652}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.30561460626596343, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004514632290906585}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.1515457985267535, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.003242282817029173}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.1339783021316465, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.004209899048276762}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.3075713065076715, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004515232151240997}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.15355200233921673, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0032933307640919023}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b88b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b88b/evaluation/generation/agg.8b7178b88b_GEM-web_nlg_en_PALM_prompt_2.json b/8b7178b88b/evaluation/generation/agg.8b7178b88b_GEM-web_nlg_en_PALM_prompt_2.json new file mode 100644 index 0000000000000000000000000000000000000000..36e4f99d543494c1fd797cae0fef1a6ae9dae325 --- /dev/null +++ b/8b7178b88b/evaluation/generation/agg.8b7178b88b_GEM-web_nlg_en_PALM_prompt_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.8216652782232776, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.04062910442416713}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.18008691481284958, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0052757038925836395}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.3711673998047281, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.00487879034297811}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.2027123169825771, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.004395624756947157}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.10008962637316307, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0037529405438827225}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.20016469360773192, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.003813720451519567}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.10928693373297448, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.003154986876758784}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.15996735275766777, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.004577626944141576}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.3460684822761284, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004492766954524856}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.18244327655886838, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.003749619328233065}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.1650914247834489, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.00477544492053463}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.3505702667663343, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004548048493270462}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.18698187602734404, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0038921774054845996}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b88b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b88b/evaluation/generation/agg.8b7178b88b_GEM-web_nlg_en_PALM_prompt_3.json b/8b7178b88b/evaluation/generation/agg.8b7178b88b_GEM-web_nlg_en_PALM_prompt_3.json new file mode 100644 index 0000000000000000000000000000000000000000..157887852a043bbfa41bd45220e2d85c68952363 --- /dev/null +++ b/8b7178b88b/evaluation/generation/agg.8b7178b88b_GEM-web_nlg_en_PALM_prompt_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.8830672069742221, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.028000457075678158}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.188815921549058, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.005405782039170827}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.38372152833073453, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004859603610175178}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.21071007543003908, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.004463218149424481}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.10432859230180822, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.003707124967324291}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.2043813472297843, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.003801503662629156}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.11292635699291721, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0031281095189860052}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.16609714125737446, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.004603337178258819}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.3553325064502732, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0044309664783451575}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.18796910977796713, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.003750496425693158}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.17111254219249275, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.004780700019520514}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.36026081429848233, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004488184055350965}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.1924829285681012, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0038880601940687624}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b88b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b88b/evaluation/generation/agg.8b7178b88b_GEM-web_nlg_en_PALM_prompt_4.json b/8b7178b88b/evaluation/generation/agg.8b7178b88b_GEM-web_nlg_en_PALM_prompt_4.json new file mode 100644 index 0000000000000000000000000000000000000000..e3b9d58978bbf65864ecc8ea11211a8eb1e8d255 --- /dev/null +++ b/8b7178b88b/evaluation/generation/agg.8b7178b88b_GEM-web_nlg_en_PALM_prompt_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 1.0358671081792514, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.04263566752630496}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.19989615669545296, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.005599957130646531}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.40336166710123866, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004818721124125534}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.22245843694786877, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0045583402573195686}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.1124336236373582, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.003935741095779227}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.21819990615637125, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.00385618079142143}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.12100972003049645, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0032743404066677153}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.17492321519899293, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.004773378480561351}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.37224158952457587, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004377948019839408}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.19760963957512798, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.00383542084139647}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.18235385466161755, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.005021694344891093}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.3793687467005697, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004423507289060084}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.20440757227679296, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.004022054785395138}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b88b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b88b/evaluation/generation/agg.8b7178b88b_GEM-web_nlg_en_PALM_prompt_5.json b/8b7178b88b/evaluation/generation/agg.8b7178b88b_GEM-web_nlg_en_PALM_prompt_5.json new file mode 100644 index 0000000000000000000000000000000000000000..c355a835d8439fc23cddb5740186620e06614124 --- /dev/null +++ b/8b7178b88b/evaluation/generation/agg.8b7178b88b_GEM-web_nlg_en_PALM_prompt_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 1.204171361933669, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.07613961296168276}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.21975255516712816, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0060000476488098085}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.4066635344523642, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0048262902071662655}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.2366466068769033, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0048055385839361016}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.1275911476917841, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.004309205748397978}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.2235792080539432, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.003950954664759423}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.13171103508163604, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0034923443640983974}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.19131328031391062, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.005134255771123987}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.37336352525066424, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0044216260882892515}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.2088535130444153, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.004052842030593682}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.1997593788485136, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.005406525039653976}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.3803285154915348, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004488995109880062}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.21625717477809833, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.004260506456488727}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b88b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b88b/evaluation/generation/agg.8b7178b88b_GEM-wiki_lingua_en_tldr_en_0.json b/8b7178b88b/evaluation/generation/agg.8b7178b88b_GEM-wiki_lingua_en_tldr_en_0.json new file mode 100644 index 0000000000000000000000000000000000000000..3af52b5ed33e47b1d57d27c29b63df0192e944df --- /dev/null +++ b/8b7178b88b/evaluation/generation/agg.8b7178b88b_GEM-wiki_lingua_en_tldr_en_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.12462462729719587, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0031826046662497306}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.16449607884346923, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.003588981148112544}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.1238366627407439, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0026637547390690967}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.030579818116461738, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.001114447996676589}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.045348988871228374, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0015776302264520795}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.03307271090107231, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0010639050828558138}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.09689369540491309, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0026833442642966994}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.1273558135465041, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002838117953205465}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.0940193069900903, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.001985212421750187}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.11762669226995941, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0030721629727453585}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.15435308236518808, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.003394722386908597}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.11606269945283079, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0025094061265404873}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 2.7397274944771954, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.10039261451919343}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b88b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b88b/evaluation/generation/agg.8b7178b88b_GEM-wiki_lingua_en_tldr_en_1.json b/8b7178b88b/evaluation/generation/agg.8b7178b88b_GEM-wiki_lingua_en_tldr_en_1.json new file mode 100644 index 0000000000000000000000000000000000000000..4060e9529dd63dcc29b46d831fba32c3d33dc5a6 --- /dev/null +++ b/8b7178b88b/evaluation/generation/agg.8b7178b88b_GEM-wiki_lingua_en_tldr_en_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.2303358349811005, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.003690727542733754}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.2154464843014795, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.00312287409246033}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.18706368194466189, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0023760001514770367}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.0623131824874716, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0021997319954224622}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.05366477872164223, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0015294014686067932}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.04664136277906473, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0012607234019787598}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.1774352175816246, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.003056714448069494}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.16262682837459477, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.00239676054267987}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.14101873450061833, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0017902413086473704}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.21694264697187762, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0035242626334641026}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.2020549195476134, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0029196969560855153}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.175474051697367, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0022207055448280263}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 2.980212171285624, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.08986977717018042}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b88b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b88b/evaluation/generation/agg.8b7178b88b_e2e_nlg_cleaned_generate_text_restaurant_0.json b/8b7178b88b/evaluation/generation/agg.8b7178b88b_e2e_nlg_cleaned_generate_text_restaurant_0.json new file mode 100644 index 0000000000000000000000000000000000000000..c28b59e6978d168b55fbd7a4abf4a2718b7ea7b4 --- /dev/null +++ b/8b7178b88b/evaluation/generation/agg.8b7178b88b_e2e_nlg_cleaned_generate_text_restaurant_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 7.805428848697077, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.12760294204588482}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.27630659363671284, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0026635424916828915}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.4517766787964781, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.003086695070399088}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.3241138419996619, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0023488121086233404}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.1264233869651961, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0021472423489400424}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.21006531093284228, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002273053133823739}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.14611347950675788, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.001555781159556189}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.23647123285513574, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0021694427334222896}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.39302733892651276, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0026453773863021526}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.2782112735172708, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0017379173406301361}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.24330576145803912, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0025941508735257053}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.3957393841813685, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0030500827793352625}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.2838669853732326, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0022710804975857187}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b88b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b88b/evaluation/generation/agg.8b7178b88b_e2e_nlg_cleaned_generate_text_restaurant_1.json b/8b7178b88b/evaluation/generation/agg.8b7178b88b_e2e_nlg_cleaned_generate_text_restaurant_1.json new file mode 100644 index 0000000000000000000000000000000000000000..d65fb38ccb7e8abc6a51f1efc5447718745ee089 --- /dev/null +++ b/8b7178b88b/evaluation/generation/agg.8b7178b88b_e2e_nlg_cleaned_generate_text_restaurant_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 12.182758345079787, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.16518841123830086}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.6058724528221369, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0033311930729353}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.4375685096869626, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.003004503828354488}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.4813086962286221, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0023626326089443398}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.29572879977984745, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0029383694383037506}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.20878267638207582, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002207007421280634}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.23028289344422687, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0021131218145040835}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.4452525524920764, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.003155514665754343}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.31741659640932457, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0024579048629975297}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.3505103154607651, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.002138758436636428}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.4958740637334028, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0033266551400865404}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.356592637216114, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0027567285724463706}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.39279988924924625, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002377886979824964}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b88b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b88b/evaluation/generation/agg.8b7178b88b_e2e_nlg_cleaned_generate_text_restaurant_2.json b/8b7178b88b/evaluation/generation/agg.8b7178b88b_e2e_nlg_cleaned_generate_text_restaurant_2.json new file mode 100644 index 0000000000000000000000000000000000000000..71c21859607a1c511987afaaa545d1d9b0b0dcf6 --- /dev/null +++ b/8b7178b88b/evaluation/generation/agg.8b7178b88b_e2e_nlg_cleaned_generate_text_restaurant_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 14.77827774961412, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.17074445414549996}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.6222132815532128, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0032116680629870925}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.4773787870946972, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002880300695039262}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.5169724859470212, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0022847828063681107}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.31734278580959246, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.002901203617815359}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.23934523412335545, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0022881777132200292}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.2598408586362927, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.002199049529931736}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.45801859712166865, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0030651884383412443}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.3483543845938943, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002450753947224449}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.37830224304770604, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0021704191814246308}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.5166167827562745, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.003243801734266107}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.3956919145577125, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002759335166433648}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.42874770680726115, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.00239536120318971}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b88b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b88b/evaluation/generation/agg.8b7178b88b_e2e_nlg_cleaned_generate_text_restaurant_3.json b/8b7178b88b/evaluation/generation/agg.8b7178b88b_e2e_nlg_cleaned_generate_text_restaurant_3.json new file mode 100644 index 0000000000000000000000000000000000000000..4170f230951d9b3a6fa428e533e6f2f77fcf4e4c --- /dev/null +++ b/8b7178b88b/evaluation/generation/agg.8b7178b88b_e2e_nlg_cleaned_generate_text_restaurant_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 15.660507663936528, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.14749957372060007}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.6220372006914571, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0031139706058727593}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.4921683601168692, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0029083346931655855}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.5280713486662109, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0022869985346214445}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.31964099722948836, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.002777708595069122}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.2509916858334456, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0023901154240661446}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.26903286770558915, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0022307748577894758}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.455321793928234, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0029321326061168074}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.35903739623304465, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0025252866229682975}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.38565827502841116, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0022144421481799675}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.5172893895354551, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.003153574847912617}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.40954269048002123, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002825679167152443}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.4394144928671385, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002446885490860059}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b88b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b88b/evaluation/generation/agg.8b7178b88b_e2e_nlg_cleaned_generate_text_restaurant_4.json b/8b7178b88b/evaluation/generation/agg.8b7178b88b_e2e_nlg_cleaned_generate_text_restaurant_4.json new file mode 100644 index 0000000000000000000000000000000000000000..2444f6c5de2ba9c92766629526726b277f7a83a2 --- /dev/null +++ b/8b7178b88b/evaluation/generation/agg.8b7178b88b_e2e_nlg_cleaned_generate_text_restaurant_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 16.046714521986758, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.20143548468737246}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.6240126615936337, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.00312720979038774}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.4989840309368499, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0028177351641601373}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.5343300631658281, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002276059193634907}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.3206493529913017, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0028268414398358497}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.2544472343665272, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0024038250271984246}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.2724112279454815, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0022911561617215254}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.4530934873979934, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0029431217749683455}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.3614836535348617, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0025050776663639207}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.38733097602553734, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0022465126119210273}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.5210977780903223, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.003193746615616614}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.41707944621670306, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002802635738849298}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.4465935641244627, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0024867305930155463}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b88b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b88b/evaluation/generation/agg.8b7178b88b_e2e_nlg_cleaned_generate_text_restaurant_5.json b/8b7178b88b/evaluation/generation/agg.8b7178b88b_e2e_nlg_cleaned_generate_text_restaurant_5.json new file mode 100644 index 0000000000000000000000000000000000000000..1d7d5986d882e42fe6f7531f8d05ef458697ddcf --- /dev/null +++ b/8b7178b88b/evaluation/generation/agg.8b7178b88b_e2e_nlg_cleaned_generate_text_restaurant_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 16.068878582309953, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.16081121483163321}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.6224102862193265, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.003110234568961701}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.500933748593845, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0027924958992030795}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.5355837269029773, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002256980681599985}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.32190257045006593, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0027959933340407817}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.2569886621162686, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002381426382114005}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.27475970807249195, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0022615182075459324}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.45606984360921154, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.002956375747033492}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.3657446339488385, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002509353106433301}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.3914922502865105, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0022467536238069325}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.5210361752122326, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.003175466781222956}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.4190489396414274, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0027531052100554392}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.4482824729485371, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002444818682804833}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b88b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b88b/evaluation/generation/agg.8b7178b88b_gem_xsum_article_DOC_summary_0.json b/8b7178b88b/evaluation/generation/agg.8b7178b88b_gem_xsum_article_DOC_summary_0.json new file mode 100644 index 0000000000000000000000000000000000000000..5e005cf0528c4f4d6dc78d0436052d00dacca1ff --- /dev/null +++ b/8b7178b88b/evaluation/generation/agg.8b7178b88b_gem_xsum_article_DOC_summary_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.12872236323811218, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0032462823876021106}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.2715393984942335, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.005900736678094209}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.16636180556058044, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.003516551179676636}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.028024322491153688, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0011655819703985627}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.06517448572813263, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002766560068276156}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.03841432091372367, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.001586981058162795}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.09534495061706572, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0027658531338571454}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.19816999370668548, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004414878706261276}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.1211817583352299, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0025835665514872593}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.10514740754117864, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0028961374555318475}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.22067225131355028, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004901108311721729}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.13466615178498392, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002869955857600535}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 1.9818055644823127, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.13978823814879407}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b88b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b88b/evaluation/generation/agg.8b7178b88b_gem_xsum_article_DOC_summary_1.json b/8b7178b88b/evaluation/generation/agg.8b7178b88b_gem_xsum_article_DOC_summary_1.json new file mode 100644 index 0000000000000000000000000000000000000000..7c4f0860596bf1df1ecf1399af535fc0ca1f976f --- /dev/null +++ b/8b7178b88b/evaluation/generation/agg.8b7178b88b_gem_xsum_article_DOC_summary_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.23797749292717868, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0044248829684158586}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.23607563998039394, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0037207865629804763}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.2252201544517192, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.003572521220076497}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.05608458865614393, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0026939326656790527}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.0508692034245319, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0022931658802725287}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.05054236360888691, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0023023749748183903}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.18150902719333478, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0036305277559064066}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.179561582857957, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.003045132003822578}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.1713099421580951, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0029320038478532935}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.18366739499452403, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.003629882854081677}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.18297857106589824, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.003137997544172217}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.17382401249824367, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0029535439613312367}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 2.718621562424974, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.25634902183378955}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b88b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b88b/evaluation/generation/agg.8b7178b88b_gem_xsum_article_DOC_summary_2.json b/8b7178b88b/evaluation/generation/agg.8b7178b88b_gem_xsum_article_DOC_summary_2.json new file mode 100644 index 0000000000000000000000000000000000000000..d894da0ba6b154c3fd433a7cfbf3296861f5a7df --- /dev/null +++ b/8b7178b88b/evaluation/generation/agg.8b7178b88b_gem_xsum_article_DOC_summary_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.26927175770553385, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.004455761662742256}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.25342716562216744, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0038549474849294127}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.2516525371976862, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0037511199505683374}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.06831364960977458, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0028257306475568847}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.06217985063286193, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0025187198385362495}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.06264124531231369, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0025022071058794777}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.20401963131847098, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0036937944194900436}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.19255452445504442, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0032146416769602863}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.19077644710608424, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.003126557023491442}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.20564280351844771, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.003691582561213757}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.1946786446186705, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0032424612854966943}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.19254279514804024, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.00313403184014492}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 3.6613673832300515, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.29305939325429936}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b88b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b88b/evaluation/generation/examples.8b7178b88b_GEM-web_nlg_en_PALM_prompt_0.jsonl b/8b7178b88b/evaluation/generation/examples.8b7178b88b_GEM-web_nlg_en_PALM_prompt_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..4c73f69f53c08e8c5740a137ecfca4c357311347 --- /dev/null +++ b/8b7178b88b/evaluation/generation/examples.8b7178b88b_GEM-web_nlg_en_PALM_prompt_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c5ef06f89f788b473f0abd2b7453e7b622de262fd2ca2e4ec6ee9d8c8db054b0 +size 4071362 diff --git a/8b7178b88b/evaluation/generation/examples.8b7178b88b_GEM-web_nlg_en_PALM_prompt_1.jsonl b/8b7178b88b/evaluation/generation/examples.8b7178b88b_GEM-web_nlg_en_PALM_prompt_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..bbcf607a15112a1126f9c288c011d109af066326 --- /dev/null +++ b/8b7178b88b/evaluation/generation/examples.8b7178b88b_GEM-web_nlg_en_PALM_prompt_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba1f76b6b2f1c9c10696db4ec5f33d226401bc579df4fa65a45675643f1969af +size 4695595 diff --git a/8b7178b88b/evaluation/generation/examples.8b7178b88b_GEM-web_nlg_en_PALM_prompt_2.jsonl b/8b7178b88b/evaluation/generation/examples.8b7178b88b_GEM-web_nlg_en_PALM_prompt_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..2bf199391fce07928d552cc878bfbbd479b54aec --- /dev/null +++ b/8b7178b88b/evaluation/generation/examples.8b7178b88b_GEM-web_nlg_en_PALM_prompt_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3889dbbc34b17469d8d15bd566ef15b4f4bfc56fe3a7bb6739fa7d2b41590eae +size 5548176 diff --git a/8b7178b88b/evaluation/generation/examples.8b7178b88b_GEM-web_nlg_en_PALM_prompt_3.jsonl b/8b7178b88b/evaluation/generation/examples.8b7178b88b_GEM-web_nlg_en_PALM_prompt_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..c78307997b7b2ccca20251f8dfb54ae84971bec6 --- /dev/null +++ b/8b7178b88b/evaluation/generation/examples.8b7178b88b_GEM-web_nlg_en_PALM_prompt_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:153f25db066af474f6cb0deead10c2afc97af1160a13547c93530e66cd0909da +size 6474285 diff --git a/8b7178b88b/evaluation/generation/examples.8b7178b88b_GEM-web_nlg_en_PALM_prompt_4.jsonl b/8b7178b88b/evaluation/generation/examples.8b7178b88b_GEM-web_nlg_en_PALM_prompt_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..2d253c573429b51cec409a5a3f2d7eea2e44a8cc --- /dev/null +++ b/8b7178b88b/evaluation/generation/examples.8b7178b88b_GEM-web_nlg_en_PALM_prompt_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10aab6241ccb5b71958061a71745b1d4e58d05a0d7ba975ec977761451c29daf +size 7367315 diff --git a/8b7178b88b/evaluation/generation/examples.8b7178b88b_GEM-web_nlg_en_PALM_prompt_5.jsonl b/8b7178b88b/evaluation/generation/examples.8b7178b88b_GEM-web_nlg_en_PALM_prompt_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..d5035e49c21173cb72559cf5e3ffe46f7f3172c5 --- /dev/null +++ b/8b7178b88b/evaluation/generation/examples.8b7178b88b_GEM-web_nlg_en_PALM_prompt_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7dc5f9fac043e02d168cc6e9d610ed68b9856eec2e9306547c2d1b28564d85d8 +size 8218091 diff --git a/8b7178b88b/evaluation/generation/examples.8b7178b88b_GEM-wiki_lingua_en_tldr_en_0.jsonl b/8b7178b88b/evaluation/generation/examples.8b7178b88b_GEM-wiki_lingua_en_tldr_en_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..3b001021f5c3af6faa11dda78d62e8f57f6636dd --- /dev/null +++ b/8b7178b88b/evaluation/generation/examples.8b7178b88b_GEM-wiki_lingua_en_tldr_en_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a52a729eb6fc2aa6ac2a07e07cf7d52fabeaf752436ba097404ffcd340a91a0 +size 7293299 diff --git a/8b7178b88b/evaluation/generation/examples.8b7178b88b_GEM-wiki_lingua_en_tldr_en_1.jsonl b/8b7178b88b/evaluation/generation/examples.8b7178b88b_GEM-wiki_lingua_en_tldr_en_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..b906dc3a57ce33c77279be146fd941771099ce39 --- /dev/null +++ b/8b7178b88b/evaluation/generation/examples.8b7178b88b_GEM-wiki_lingua_en_tldr_en_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cefdc20d2b9c713956962ce57cc918f4ee2fe249aa8a7a467204df0a242fde5f +size 12999255 diff --git a/8b7178b88b/evaluation/generation/examples.8b7178b88b_GEM-wiki_lingua_en_tldr_en_2.jsonl b/8b7178b88b/evaluation/generation/examples.8b7178b88b_GEM-wiki_lingua_en_tldr_en_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/8b7178b88b/evaluation/generation/examples.8b7178b88b_GEM-wiki_lingua_en_tldr_en_3.jsonl b/8b7178b88b/evaluation/generation/examples.8b7178b88b_GEM-wiki_lingua_en_tldr_en_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/8b7178b88b/evaluation/generation/examples.8b7178b88b_GEM-wiki_lingua_en_tldr_en_4.jsonl b/8b7178b88b/evaluation/generation/examples.8b7178b88b_GEM-wiki_lingua_en_tldr_en_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/8b7178b88b/evaluation/generation/examples.8b7178b88b_GEM-wiki_lingua_en_tldr_en_5.jsonl b/8b7178b88b/evaluation/generation/examples.8b7178b88b_GEM-wiki_lingua_en_tldr_en_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/8b7178b88b/evaluation/generation/examples.8b7178b88b_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl b/8b7178b88b/evaluation/generation/examples.8b7178b88b_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..136a383020a6c833c408a59854dceacf10040d58 --- /dev/null +++ b/8b7178b88b/evaluation/generation/examples.8b7178b88b_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b0d7fa6a82d586ff3e5ea9048ff652342cc4a47d3afc53dac46c85a986a9a348 +size 4335793 diff --git a/8b7178b88b/evaluation/generation/examples.8b7178b88b_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl b/8b7178b88b/evaluation/generation/examples.8b7178b88b_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..91904326f5728d571efb1bc37af7e0c49a4b0b40 --- /dev/null +++ b/8b7178b88b/evaluation/generation/examples.8b7178b88b_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9cb1c74d4fdb29c97be8e44857c10337ec89453f857b86eed2a24ba5fd09f322 +size 4984146 diff --git a/8b7178b88b/evaluation/generation/examples.8b7178b88b_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl b/8b7178b88b/evaluation/generation/examples.8b7178b88b_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..c725bd0741a255333a6440e931dfdfdc4cb23e10 --- /dev/null +++ b/8b7178b88b/evaluation/generation/examples.8b7178b88b_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d91d05640526e59a16caefa9f06146123fba7ff7a850ed1e99e61d2b935cf518 +size 6082973 diff --git a/8b7178b88b/evaluation/generation/examples.8b7178b88b_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl b/8b7178b88b/evaluation/generation/examples.8b7178b88b_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..059cb211671b37dd62ec85494c0da889ac9fe367 --- /dev/null +++ b/8b7178b88b/evaluation/generation/examples.8b7178b88b_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4af087a4f066e6f16d3f58de682ea4d716667c87693519b836f5c385ba2e04f0 +size 7172275 diff --git a/8b7178b88b/evaluation/generation/examples.8b7178b88b_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl b/8b7178b88b/evaluation/generation/examples.8b7178b88b_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..dea93d6a47a1b66ba7c31f265d11754c60ed685f --- /dev/null +++ b/8b7178b88b/evaluation/generation/examples.8b7178b88b_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d1a641265cbd8eac74992cc4a920231ff46bd412f1b9679833b4f3a85a5a7e31 +size 8254389 diff --git a/8b7178b88b/evaluation/generation/examples.8b7178b88b_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl b/8b7178b88b/evaluation/generation/examples.8b7178b88b_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..0c06ba26f5fae012f1149d83ffdf7c06d4fb341b --- /dev/null +++ b/8b7178b88b/evaluation/generation/examples.8b7178b88b_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b53e562da07c9c8d57c03a7ee00e623a9ec6d578dc20692a64942c046107660b +size 9342876 diff --git a/8b7178b88b/evaluation/generation/examples.8b7178b88b_gem_xsum_article_DOC_summary_0.jsonl b/8b7178b88b/evaluation/generation/examples.8b7178b88b_gem_xsum_article_DOC_summary_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..65b4e3a0bbf19a64fd46953b22eedb2dfbc7f780 --- /dev/null +++ b/8b7178b88b/evaluation/generation/examples.8b7178b88b_gem_xsum_article_DOC_summary_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c978bc629deb8c8c8232e4e1af5a285512a66f803926d1e377654d4e385299d5 +size 2750606 diff --git a/8b7178b88b/evaluation/generation/examples.8b7178b88b_gem_xsum_article_DOC_summary_1.jsonl b/8b7178b88b/evaluation/generation/examples.8b7178b88b_gem_xsum_article_DOC_summary_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..d1ac08302a90cb69439cca9a4ddf74f69bb2c2c6 --- /dev/null +++ b/8b7178b88b/evaluation/generation/examples.8b7178b88b_gem_xsum_article_DOC_summary_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e46165684467d440e3d9f3f01692cbb72acd3a4eafa561a6fd4404d300c9b08 +size 4911785 diff --git a/8b7178b88b/evaluation/generation/examples.8b7178b88b_gem_xsum_article_DOC_summary_2.jsonl b/8b7178b88b/evaluation/generation/examples.8b7178b88b_gem_xsum_article_DOC_summary_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..9a1d8a3a4704f018935781f3892cb252a67c28e8 --- /dev/null +++ b/8b7178b88b/evaluation/generation/examples.8b7178b88b_gem_xsum_article_DOC_summary_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f2c0257a184e74574462c6deb94896347e1a7cb8a67aedab6cc8d5fc6a55f62e +size 7172095 diff --git a/8b7178b88b/evaluation/generation/examples.8b7178b88b_gem_xsum_article_DOC_summary_3.jsonl b/8b7178b88b/evaluation/generation/examples.8b7178b88b_gem_xsum_article_DOC_summary_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/8b7178b88b/evaluation/generation/examples.8b7178b88b_gem_xsum_article_DOC_summary_4.jsonl b/8b7178b88b/evaluation/generation/examples.8b7178b88b_gem_xsum_article_DOC_summary_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/8b7178b88b/evaluation/generation/examples.8b7178b88b_gem_xsum_article_DOC_summary_5.jsonl b/8b7178b88b/evaluation/generation/examples.8b7178b88b_gem_xsum_article_DOC_summary_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/8b7178b88b/evaluation/generation/slim.8b7178b88b_GEM-web_nlg_en_PALM_prompt_0.json b/8b7178b88b/evaluation/generation/slim.8b7178b88b_GEM-web_nlg_en_PALM_prompt_0.json new file mode 100644 index 0000000000000000000000000000000000000000..88c6c7c9c0a522ff8516b656ffef03c665aff1a1 --- /dev/null +++ b/8b7178b88b/evaluation/generation/slim.8b7178b88b_GEM-web_nlg_en_PALM_prompt_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.3018678413532531, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.02844023781425127 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.07529613947856881, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.001982838396838402 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.3128650370000908, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0050801382033981305 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.10892691674779821, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0019071235551653418 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.03417694669369951, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.001313368572681446 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.14493621807358514, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0032191726931486194 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.049040742381146675, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0011519113898695909 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.07180450626627975, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.001883124040127771 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.30107392723259574, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004911398619361963 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.10396046493580034, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.001778756221046735 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.0720836832710309, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.001909971490636727 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.29709085493162957, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004719450806012623 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.10404327940071008, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.001820581250965178 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b88b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b88b/evaluation/generation/slim.8b7178b88b_GEM-web_nlg_en_PALM_prompt_1.json b/8b7178b88b/evaluation/generation/slim.8b7178b88b_GEM-web_nlg_en_PALM_prompt_1.json new file mode 100644 index 0000000000000000000000000000000000000000..0d9f7821842bdd8536d5127a541a6597649fac15 --- /dev/null +++ b/8b7178b88b/evaluation/generation/slim.8b7178b88b_GEM-web_nlg_en_PALM_prompt_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.5232740840707778, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.020854898797383486 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.14535656258632043, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.00467037788995567 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.32467105717536826, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.004844586825107793 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.1654988415912321, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.003746858529251122 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.07725516531902364, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0033727094011323654 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.16618004223187002, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.003573100663317745 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.08445836822356238, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0026512482133539865 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.1318447100821655, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.004146806578291652 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.30561460626596343, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004514632290906585 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.1515457985267535, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.003242282817029173 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.1339783021316465, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.004209899048276762 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.3075713065076715, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004515232151240997 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.15355200233921673, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0032933307640919023 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b88b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b88b/evaluation/generation/slim.8b7178b88b_GEM-web_nlg_en_PALM_prompt_2.json b/8b7178b88b/evaluation/generation/slim.8b7178b88b_GEM-web_nlg_en_PALM_prompt_2.json new file mode 100644 index 0000000000000000000000000000000000000000..a9debf5ef019e8af9f42ad370002290ae2b2ba82 --- /dev/null +++ b/8b7178b88b/evaluation/generation/slim.8b7178b88b_GEM-web_nlg_en_PALM_prompt_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.8216652782232776, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.04062910442416713 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.18008691481284958, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0052757038925836395 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.3711673998047281, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.00487879034297811 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.2027123169825771, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.004395624756947157 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.10008962637316307, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0037529405438827225 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.20016469360773192, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.003813720451519567 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.10928693373297448, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.003154986876758784 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.15996735275766777, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.004577626944141576 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.3460684822761284, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004492766954524856 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.18244327655886838, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.003749619328233065 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.1650914247834489, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.00477544492053463 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.3505702667663343, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004548048493270462 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.18698187602734404, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0038921774054845996 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b88b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b88b/evaluation/generation/slim.8b7178b88b_GEM-web_nlg_en_PALM_prompt_3.json b/8b7178b88b/evaluation/generation/slim.8b7178b88b_GEM-web_nlg_en_PALM_prompt_3.json new file mode 100644 index 0000000000000000000000000000000000000000..ef0fcaec64ead26b87edc3d43cc7b68edd040fe1 --- /dev/null +++ b/8b7178b88b/evaluation/generation/slim.8b7178b88b_GEM-web_nlg_en_PALM_prompt_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.8830672069742221, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.028000457075678158 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.188815921549058, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.005405782039170827 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.38372152833073453, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.004859603610175178 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.21071007543003908, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.004463218149424481 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.10432859230180822, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.003707124967324291 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.2043813472297843, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.003801503662629156 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.11292635699291721, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0031281095189860052 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.16609714125737446, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.004603337178258819 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.3553325064502732, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0044309664783451575 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.18796910977796713, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.003750496425693158 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.17111254219249275, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.004780700019520514 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.36026081429848233, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004488184055350965 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.1924829285681012, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0038880601940687624 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b88b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b88b/evaluation/generation/slim.8b7178b88b_GEM-web_nlg_en_PALM_prompt_4.json b/8b7178b88b/evaluation/generation/slim.8b7178b88b_GEM-web_nlg_en_PALM_prompt_4.json new file mode 100644 index 0000000000000000000000000000000000000000..314e833fbb3baf97407218f5d451047f158b0ee0 --- /dev/null +++ b/8b7178b88b/evaluation/generation/slim.8b7178b88b_GEM-web_nlg_en_PALM_prompt_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 1.0358671081792514, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.04263566752630496 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.19989615669545296, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.005599957130646531 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.40336166710123866, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.004818721124125534 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.22245843694786877, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0045583402573195686 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.1124336236373582, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.003935741095779227 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.21819990615637125, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.00385618079142143 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.12100972003049645, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0032743404066677153 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.17492321519899293, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.004773378480561351 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.37224158952457587, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004377948019839408 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.19760963957512798, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.00383542084139647 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.18235385466161755, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.005021694344891093 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.3793687467005697, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004423507289060084 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.20440757227679296, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.004022054785395138 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b88b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b88b/evaluation/generation/slim.8b7178b88b_GEM-web_nlg_en_PALM_prompt_5.json b/8b7178b88b/evaluation/generation/slim.8b7178b88b_GEM-web_nlg_en_PALM_prompt_5.json new file mode 100644 index 0000000000000000000000000000000000000000..5719a0ac51c97abbfc11a4b4c652c96a18e6531f --- /dev/null +++ b/8b7178b88b/evaluation/generation/slim.8b7178b88b_GEM-web_nlg_en_PALM_prompt_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 1.204171361933669, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.07613961296168276 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.21975255516712816, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0060000476488098085 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.4066635344523642, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0048262902071662655 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.2366466068769033, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0048055385839361016 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.1275911476917841, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.004309205748397978 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.2235792080539432, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.003950954664759423 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.13171103508163604, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0034923443640983974 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.19131328031391062, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.005134255771123987 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.37336352525066424, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0044216260882892515 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.2088535130444153, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.004052842030593682 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.1997593788485136, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.005406525039653976 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.3803285154915348, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004488995109880062 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.21625717477809833, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.004260506456488727 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b88b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b88b/evaluation/generation/slim.8b7178b88b_GEM-wiki_lingua_en_tldr_en_0.json b/8b7178b88b/evaluation/generation/slim.8b7178b88b_GEM-wiki_lingua_en_tldr_en_0.json new file mode 100644 index 0000000000000000000000000000000000000000..28d6a9887a25793cce84976b2fdd890057d6cd73 --- /dev/null +++ b/8b7178b88b/evaluation/generation/slim.8b7178b88b_GEM-wiki_lingua_en_tldr_en_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.12462462729719587, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0031826046662497306 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.16449607884346923, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.003588981148112544 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.1238366627407439, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0026637547390690967 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.030579818116461738, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.001114447996676589 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.045348988871228374, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0015776302264520795 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.03307271090107231, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0010639050828558138 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.09689369540491309, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0026833442642966994 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.1273558135465041, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.002838117953205465 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.0940193069900903, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.001985212421750187 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.11762669226995941, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0030721629727453585 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.15435308236518808, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.003394722386908597 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.11606269945283079, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0025094061265404873 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 2.7397274944771954, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.10039261451919343 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b88b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b88b/evaluation/generation/slim.8b7178b88b_GEM-wiki_lingua_en_tldr_en_1.json b/8b7178b88b/evaluation/generation/slim.8b7178b88b_GEM-wiki_lingua_en_tldr_en_1.json new file mode 100644 index 0000000000000000000000000000000000000000..f591d85292a95b3aed4b1e124eaaf0ebb1071783 --- /dev/null +++ b/8b7178b88b/evaluation/generation/slim.8b7178b88b_GEM-wiki_lingua_en_tldr_en_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.2303358349811005, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.003690727542733754 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.2154464843014795, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.00312287409246033 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.18706368194466189, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0023760001514770367 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.0623131824874716, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0021997319954224622 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.05366477872164223, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0015294014686067932 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.04664136277906473, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0012607234019787598 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.1774352175816246, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.003056714448069494 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.16262682837459477, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.00239676054267987 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.14101873450061833, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0017902413086473704 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.21694264697187762, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0035242626334641026 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.2020549195476134, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0029196969560855153 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.175474051697367, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0022207055448280263 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 2.980212171285624, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.08986977717018042 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b88b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b88b/evaluation/generation/slim.8b7178b88b_e2e_nlg_cleaned_generate_text_restaurant_0.json b/8b7178b88b/evaluation/generation/slim.8b7178b88b_e2e_nlg_cleaned_generate_text_restaurant_0.json new file mode 100644 index 0000000000000000000000000000000000000000..7f30b0c2ac6c5f5bf3498623a2671fe69d643a1b --- /dev/null +++ b/8b7178b88b/evaluation/generation/slim.8b7178b88b_e2e_nlg_cleaned_generate_text_restaurant_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 7.805428848697077, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.12760294204588482 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.27630659363671284, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0026635424916828915 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.4517766787964781, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.003086695070399088 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.3241138419996619, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0023488121086233404 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.1264233869651961, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0021472423489400424 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.21006531093284228, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.002273053133823739 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.14611347950675788, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.001555781159556189 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.23647123285513574, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0021694427334222896 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.39302733892651276, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0026453773863021526 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.2782112735172708, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0017379173406301361 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.24330576145803912, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0025941508735257053 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.3957393841813685, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0030500827793352625 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.2838669853732326, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0022710804975857187 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b88b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b88b/evaluation/generation/slim.8b7178b88b_e2e_nlg_cleaned_generate_text_restaurant_1.json b/8b7178b88b/evaluation/generation/slim.8b7178b88b_e2e_nlg_cleaned_generate_text_restaurant_1.json new file mode 100644 index 0000000000000000000000000000000000000000..40699160cad708c8738c07f271eaba12864b6c91 --- /dev/null +++ b/8b7178b88b/evaluation/generation/slim.8b7178b88b_e2e_nlg_cleaned_generate_text_restaurant_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 12.182758345079787, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.16518841123830086 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.6058724528221369, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0033311930729353 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.4375685096869626, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.003004503828354488 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.4813086962286221, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0023626326089443398 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.29572879977984745, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0029383694383037506 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.20878267638207582, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.002207007421280634 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.23028289344422687, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0021131218145040835 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.4452525524920764, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.003155514665754343 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.31741659640932457, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0024579048629975297 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.3505103154607651, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.002138758436636428 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.4958740637334028, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0033266551400865404 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.356592637216114, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0027567285724463706 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.39279988924924625, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.002377886979824964 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b88b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b88b/evaluation/generation/slim.8b7178b88b_e2e_nlg_cleaned_generate_text_restaurant_2.json b/8b7178b88b/evaluation/generation/slim.8b7178b88b_e2e_nlg_cleaned_generate_text_restaurant_2.json new file mode 100644 index 0000000000000000000000000000000000000000..88c01066d0d69c15d358b54c126b9d96da070405 --- /dev/null +++ b/8b7178b88b/evaluation/generation/slim.8b7178b88b_e2e_nlg_cleaned_generate_text_restaurant_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 14.77827774961412, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.17074445414549996 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.6222132815532128, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0032116680629870925 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.4773787870946972, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.002880300695039262 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.5169724859470212, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0022847828063681107 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.31734278580959246, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.002901203617815359 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.23934523412335545, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0022881777132200292 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.2598408586362927, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.002199049529931736 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.45801859712166865, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0030651884383412443 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.3483543845938943, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.002450753947224449 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.37830224304770604, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0021704191814246308 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.5166167827562745, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.003243801734266107 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.3956919145577125, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.002759335166433648 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.42874770680726115, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.00239536120318971 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b88b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b88b/evaluation/generation/slim.8b7178b88b_e2e_nlg_cleaned_generate_text_restaurant_3.json b/8b7178b88b/evaluation/generation/slim.8b7178b88b_e2e_nlg_cleaned_generate_text_restaurant_3.json new file mode 100644 index 0000000000000000000000000000000000000000..a98796d1a754c4e083c4d9d6ef2329dde8f22275 --- /dev/null +++ b/8b7178b88b/evaluation/generation/slim.8b7178b88b_e2e_nlg_cleaned_generate_text_restaurant_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 15.660507663936528, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.14749957372060007 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.6220372006914571, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0031139706058727593 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.4921683601168692, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0029083346931655855 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.5280713486662109, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0022869985346214445 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.31964099722948836, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.002777708595069122 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.2509916858334456, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0023901154240661446 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.26903286770558915, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0022307748577894758 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.455321793928234, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0029321326061168074 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.35903739623304465, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0025252866229682975 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.38565827502841116, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0022144421481799675 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.5172893895354551, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.003153574847912617 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.40954269048002123, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.002825679167152443 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.4394144928671385, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.002446885490860059 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b88b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b88b/evaluation/generation/slim.8b7178b88b_e2e_nlg_cleaned_generate_text_restaurant_4.json b/8b7178b88b/evaluation/generation/slim.8b7178b88b_e2e_nlg_cleaned_generate_text_restaurant_4.json new file mode 100644 index 0000000000000000000000000000000000000000..a79d55adea920a7f66aeeff0b1b12b23784057fb --- /dev/null +++ b/8b7178b88b/evaluation/generation/slim.8b7178b88b_e2e_nlg_cleaned_generate_text_restaurant_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 16.046714521986758, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.20143548468737246 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.6240126615936337, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.00312720979038774 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.4989840309368499, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0028177351641601373 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.5343300631658281, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.002276059193634907 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.3206493529913017, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0028268414398358497 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.2544472343665272, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0024038250271984246 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.2724112279454815, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0022911561617215254 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.4530934873979934, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0029431217749683455 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.3614836535348617, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0025050776663639207 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.38733097602553734, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0022465126119210273 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.5210977780903223, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.003193746615616614 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.41707944621670306, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.002802635738849298 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.4465935641244627, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0024867305930155463 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b88b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b88b/evaluation/generation/slim.8b7178b88b_e2e_nlg_cleaned_generate_text_restaurant_5.json b/8b7178b88b/evaluation/generation/slim.8b7178b88b_e2e_nlg_cleaned_generate_text_restaurant_5.json new file mode 100644 index 0000000000000000000000000000000000000000..d2ef1fd385aa4656db6deff16ca2ca7c332d8e56 --- /dev/null +++ b/8b7178b88b/evaluation/generation/slim.8b7178b88b_e2e_nlg_cleaned_generate_text_restaurant_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 16.068878582309953, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.16081121483163321 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.6224102862193265, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.003110234568961701 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.500933748593845, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0027924958992030795 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.5355837269029773, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.002256980681599985 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.32190257045006593, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0027959933340407817 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.2569886621162686, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.002381426382114005 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.27475970807249195, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0022615182075459324 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.45606984360921154, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.002956375747033492 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.3657446339488385, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.002509353106433301 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.3914922502865105, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0022467536238069325 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.5210361752122326, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.003175466781222956 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.4190489396414274, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0027531052100554392 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.4482824729485371, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.002444818682804833 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b88b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b88b/evaluation/generation/slim.8b7178b88b_gem_xsum_article_DOC_summary_0.json b/8b7178b88b/evaluation/generation/slim.8b7178b88b_gem_xsum_article_DOC_summary_0.json new file mode 100644 index 0000000000000000000000000000000000000000..05e3b2a5326457be73fbdd7655932617d913e98a --- /dev/null +++ b/8b7178b88b/evaluation/generation/slim.8b7178b88b_gem_xsum_article_DOC_summary_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.12872236323811218, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0032462823876021106 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.2715393984942335, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.005900736678094209 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.16636180556058044, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.003516551179676636 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.028024322491153688, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0011655819703985627 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.06517448572813263, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.002766560068276156 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.03841432091372367, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.001586981058162795 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.09534495061706572, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0027658531338571454 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.19816999370668548, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.004414878706261276 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.1211817583352299, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0025835665514872593 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.10514740754117864, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0028961374555318475 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.22067225131355028, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.004901108311721729 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.13466615178498392, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.002869955857600535 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 1.9818055644823127, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.13978823814879407 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b88b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b88b/evaluation/generation/slim.8b7178b88b_gem_xsum_article_DOC_summary_1.json b/8b7178b88b/evaluation/generation/slim.8b7178b88b_gem_xsum_article_DOC_summary_1.json new file mode 100644 index 0000000000000000000000000000000000000000..c62bc575eafe247cfa2fcdab9d662444036fb96e --- /dev/null +++ b/8b7178b88b/evaluation/generation/slim.8b7178b88b_gem_xsum_article_DOC_summary_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.23797749292717868, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0044248829684158586 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.23607563998039394, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.0037207865629804763 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.2252201544517192, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.003572521220076497 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.05608458865614393, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0026939326656790527 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.0508692034245319, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0022931658802725287 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.05054236360888691, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0023023749748183903 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.18150902719333478, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0036305277559064066 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.179561582857957, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.003045132003822578 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.1713099421580951, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0029320038478532935 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.18366739499452403, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.003629882854081677 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.18297857106589824, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.003137997544172217 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.17382401249824367, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0029535439613312367 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 2.718621562424974, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.25634902183378955 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b88b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b88b/evaluation/generation/slim.8b7178b88b_gem_xsum_article_DOC_summary_2.json b/8b7178b88b/evaluation/generation/slim.8b7178b88b_gem_xsum_article_DOC_summary_2.json new file mode 100644 index 0000000000000000000000000000000000000000..9bb03e40c79d2a50d9497b3b53975b3b77ea4dde --- /dev/null +++ b/8b7178b88b/evaluation/generation/slim.8b7178b88b_gem_xsum_article_DOC_summary_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.26927175770553385, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.004455761662742256 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.25342716562216744, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.0038549474849294127 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.2516525371976862, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0037511199505683374 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.06831364960977458, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0028257306475568847 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.06217985063286193, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0025187198385362495 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.06264124531231369, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0025022071058794777 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.20401963131847098, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0036937944194900436 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.19255452445504442, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0032146416769602863 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.19077644710608424, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.003126557023491442 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.20564280351844771, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.003691582561213757 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.1946786446186705, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0032424612854966943 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.19254279514804024, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.00313403184014492 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 3.6613673832300515, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.29305939325429936 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b88b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b88b/evaluation/rankeval/8b7178b88b_0.json b/8b7178b88b/evaluation/rankeval/8b7178b88b_0.json new file mode 100644 index 0000000000000000000000000000000000000000..3a6ae496e9f35cb4e578ca4c85f7bfb731142f36 --- /dev/null +++ b/8b7178b88b/evaluation/rankeval/8b7178b88b_0.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.328, + "acc_stderr": 0.014853842487270334 + }, + "anli_r2": { + "acc": 0.344, + "acc_stderr": 0.015029633724408943 + }, + "anli_r3": { + "acc": 0.38333333333333336, + "acc_stderr": 0.014041190711780102 + }, + "cb": { + "acc": 0.3392857142857143, + "acc_stderr": 0.06384226561930825, + "f1": 0.22990271377368152 + }, + "copa": { + "acc": 0.74, + "acc_stderr": 0.04408440022768077 + }, + "hellaswag": { + "acc": 0.4500099581756622, + "acc_stderr": 0.004964779805180658, + "acc_norm": 0.5852419836685919, + "acc_norm_stderr": 0.004916733258140278 + }, + "rte": { + "acc": 0.4693140794223827, + "acc_stderr": 0.03003973059219781 + }, + "winogrande": { + "acc": 0.5643251775848461, + "acc_stderr": 0.013935709739615708 + }, + "storycloze_2016": { + "acc": 0.7022982362373063, + "acc_stderr": 0.010573790208173063 + }, + "boolq": { + "acc": 0.5345565749235474, + "acc_stderr": 0.008724144040604807 + }, + "arc_easy": { + "acc": 0.6203703703703703, + "acc_stderr": 0.009958037725468567, + "acc_norm": 0.5622895622895623, + "acc_norm_stderr": 0.010179856486006906 + }, + "arc_challenge": { + "acc": 0.2773037542662116, + "acc_stderr": 0.013082095839059374, + "acc_norm": 0.2935153583617747, + "acc_norm_stderr": 0.013307250444941118 + }, + "sciq": { + "acc": 0.86, + "acc_stderr": 0.010978183844357805, + "acc_norm": 0.793, + "acc_norm_stderr": 0.012818553557843984 + }, + "piqa": { + "acc": 0.7486398258977149, + "acc_stderr": 0.01012115601681926, + "acc_norm": 0.7529923830250272, + "acc_norm_stderr": 0.01006226814077264 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/8b7178b88b/evaluation/rankeval/8b7178b88b_0_lm-eval_global_step84877_2023-01-30-20-00-12_0shots_backup.json b/8b7178b88b/evaluation/rankeval/8b7178b88b_0_lm-eval_global_step84877_2023-01-30-20-00-12_0shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..3a6ae496e9f35cb4e578ca4c85f7bfb731142f36 --- /dev/null +++ b/8b7178b88b/evaluation/rankeval/8b7178b88b_0_lm-eval_global_step84877_2023-01-30-20-00-12_0shots_backup.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.328, + "acc_stderr": 0.014853842487270334 + }, + "anli_r2": { + "acc": 0.344, + "acc_stderr": 0.015029633724408943 + }, + "anli_r3": { + "acc": 0.38333333333333336, + "acc_stderr": 0.014041190711780102 + }, + "cb": { + "acc": 0.3392857142857143, + "acc_stderr": 0.06384226561930825, + "f1": 0.22990271377368152 + }, + "copa": { + "acc": 0.74, + "acc_stderr": 0.04408440022768077 + }, + "hellaswag": { + "acc": 0.4500099581756622, + "acc_stderr": 0.004964779805180658, + "acc_norm": 0.5852419836685919, + "acc_norm_stderr": 0.004916733258140278 + }, + "rte": { + "acc": 0.4693140794223827, + "acc_stderr": 0.03003973059219781 + }, + "winogrande": { + "acc": 0.5643251775848461, + "acc_stderr": 0.013935709739615708 + }, + "storycloze_2016": { + "acc": 0.7022982362373063, + "acc_stderr": 0.010573790208173063 + }, + "boolq": { + "acc": 0.5345565749235474, + "acc_stderr": 0.008724144040604807 + }, + "arc_easy": { + "acc": 0.6203703703703703, + "acc_stderr": 0.009958037725468567, + "acc_norm": 0.5622895622895623, + "acc_norm_stderr": 0.010179856486006906 + }, + "arc_challenge": { + "acc": 0.2773037542662116, + "acc_stderr": 0.013082095839059374, + "acc_norm": 0.2935153583617747, + "acc_norm_stderr": 0.013307250444941118 + }, + "sciq": { + "acc": 0.86, + "acc_stderr": 0.010978183844357805, + "acc_norm": 0.793, + "acc_norm_stderr": 0.012818553557843984 + }, + "piqa": { + "acc": 0.7486398258977149, + "acc_stderr": 0.01012115601681926, + "acc_norm": 0.7529923830250272, + "acc_norm_stderr": 0.01006226814077264 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/8b7178b88b/evaluation/rankeval/8b7178b88b_1.json b/8b7178b88b/evaluation/rankeval/8b7178b88b_1.json new file mode 100644 index 0000000000000000000000000000000000000000..d0ae856013a7afafad04a0dfe9e4af7fc41d77c7 --- /dev/null +++ b/8b7178b88b/evaluation/rankeval/8b7178b88b_1.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.314, + "acc_stderr": 0.014683991951087966 + }, + "anli_r2": { + "acc": 0.347, + "acc_stderr": 0.015060472031706615 + }, + "anli_r3": { + "acc": 0.3333333333333333, + "acc_stderr": 0.013613950010225606 + }, + "cb": { + "acc": 0.48214285714285715, + "acc_stderr": 0.06737697508644648, + "f1": 0.3421052631578947 + }, + "copa": { + "acc": 0.77, + "acc_stderr": 0.04229525846816506 + }, + "hellaswag": { + "acc": 0.45180242979486157, + "acc_stderr": 0.004966544724452226, + "acc_norm": 0.5972913762198765, + "acc_norm_stderr": 0.004894407257215795 + }, + "rte": { + "acc": 0.5018050541516246, + "acc_stderr": 0.030096267148976626 + }, + "winogrande": { + "acc": 0.5832675611681136, + "acc_stderr": 0.013856250072796316 + }, + "storycloze_2016": { + "acc": 0.7001603420630679, + "acc_stderr": 0.010595525174558607 + }, + "boolq": { + "acc": 0.5529051987767584, + "acc_stderr": 0.008695963064172729 + }, + "arc_easy": { + "acc": 0.6367845117845118, + "acc_stderr": 0.009868397136118798, + "acc_norm": 0.6376262626262627, + "acc_norm_stderr": 0.00986346820258377 + }, + "arc_challenge": { + "acc": 0.30204778156996587, + "acc_stderr": 0.013417519144716422, + "acc_norm": 0.32081911262798635, + "acc_norm_stderr": 0.013640943091946526 + }, + "sciq": { + "acc": 0.913, + "acc_stderr": 0.008916866630745916, + "acc_norm": 0.917, + "acc_norm_stderr": 0.00872852720607479 + }, + "piqa": { + "acc": 0.7453754080522307, + "acc_stderr": 0.010164432237060489, + "acc_norm": 0.749727965179543, + "acc_norm_stderr": 0.010106561880089767 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/8b7178b88b/evaluation/rankeval/8b7178b88b_1_lm-eval_global_step84877_2023-01-30-20-00-12_1shots_backup.json b/8b7178b88b/evaluation/rankeval/8b7178b88b_1_lm-eval_global_step84877_2023-01-30-20-00-12_1shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..d0ae856013a7afafad04a0dfe9e4af7fc41d77c7 --- /dev/null +++ b/8b7178b88b/evaluation/rankeval/8b7178b88b_1_lm-eval_global_step84877_2023-01-30-20-00-12_1shots_backup.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.314, + "acc_stderr": 0.014683991951087966 + }, + "anli_r2": { + "acc": 0.347, + "acc_stderr": 0.015060472031706615 + }, + "anli_r3": { + "acc": 0.3333333333333333, + "acc_stderr": 0.013613950010225606 + }, + "cb": { + "acc": 0.48214285714285715, + "acc_stderr": 0.06737697508644648, + "f1": 0.3421052631578947 + }, + "copa": { + "acc": 0.77, + "acc_stderr": 0.04229525846816506 + }, + "hellaswag": { + "acc": 0.45180242979486157, + "acc_stderr": 0.004966544724452226, + "acc_norm": 0.5972913762198765, + "acc_norm_stderr": 0.004894407257215795 + }, + "rte": { + "acc": 0.5018050541516246, + "acc_stderr": 0.030096267148976626 + }, + "winogrande": { + "acc": 0.5832675611681136, + "acc_stderr": 0.013856250072796316 + }, + "storycloze_2016": { + "acc": 0.7001603420630679, + "acc_stderr": 0.010595525174558607 + }, + "boolq": { + "acc": 0.5529051987767584, + "acc_stderr": 0.008695963064172729 + }, + "arc_easy": { + "acc": 0.6367845117845118, + "acc_stderr": 0.009868397136118798, + "acc_norm": 0.6376262626262627, + "acc_norm_stderr": 0.00986346820258377 + }, + "arc_challenge": { + "acc": 0.30204778156996587, + "acc_stderr": 0.013417519144716422, + "acc_norm": 0.32081911262798635, + "acc_norm_stderr": 0.013640943091946526 + }, + "sciq": { + "acc": 0.913, + "acc_stderr": 0.008916866630745916, + "acc_norm": 0.917, + "acc_norm_stderr": 0.00872852720607479 + }, + "piqa": { + "acc": 0.7453754080522307, + "acc_stderr": 0.010164432237060489, + "acc_norm": 0.749727965179543, + "acc_norm_stderr": 0.010106561880089767 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/8b7178b88b/evaluation/rankeval/8b7178b88b_2.json b/8b7178b88b/evaluation/rankeval/8b7178b88b_2.json new file mode 100644 index 0000000000000000000000000000000000000000..39a60eb963ca1d8a47ef18134c20ef76b1c5ea87 --- /dev/null +++ b/8b7178b88b/evaluation/rankeval/8b7178b88b_2.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.296, + "acc_stderr": 0.014442734941575018 + }, + "anli_r2": { + "acc": 0.355, + "acc_stderr": 0.01513949154378053 + }, + "anli_r3": { + "acc": 0.3233333333333333, + "acc_stderr": 0.013508372867300222 + }, + "cb": { + "acc": 0.39285714285714285, + "acc_stderr": 0.0658538889806635, + "f1": 0.28226120857699805 + }, + "copa": { + "acc": 0.77, + "acc_stderr": 0.04229525846816506 + }, + "hellaswag": { + "acc": 0.45737900816570404, + "acc_stderr": 0.004971619995879763, + "acc_norm": 0.6022704640509858, + "acc_norm_stderr": 0.004884287515461492 + }, + "rte": { + "acc": 0.47653429602888087, + "acc_stderr": 0.030063300411902652 + }, + "winogrande": { + "acc": 0.5698500394632992, + "acc_stderr": 0.013914685094716692 + }, + "storycloze_2016": { + "acc": 0.6996258685195083, + "acc_stderr": 0.010600915927985021 + }, + "boolq": { + "acc": 0.5724770642201835, + "acc_stderr": 0.008652692997177339 + }, + "arc_easy": { + "acc": 0.6384680134680135, + "acc_stderr": 0.009858506543162063, + "acc_norm": 0.6473063973063973, + "acc_norm_stderr": 0.009804420599378657 + }, + "arc_challenge": { + "acc": 0.3037542662116041, + "acc_stderr": 0.013438909184778755, + "acc_norm": 0.34215017064846415, + "acc_norm_stderr": 0.013864152159177278 + }, + "sciq": { + "acc": 0.923, + "acc_stderr": 0.008434580140240637, + "acc_norm": 0.926, + "acc_norm_stderr": 0.008282064512704159 + }, + "piqa": { + "acc": 0.7442872687704026, + "acc_stderr": 0.010178690109459857, + "acc_norm": 0.7546245919477693, + "acc_norm_stderr": 0.010039831320422386 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/8b7178b88b/evaluation/rankeval/8b7178b88b_2_lm-eval_global_step84877_2023-01-30-20-00-12_2shots_backup.json b/8b7178b88b/evaluation/rankeval/8b7178b88b_2_lm-eval_global_step84877_2023-01-30-20-00-12_2shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..39a60eb963ca1d8a47ef18134c20ef76b1c5ea87 --- /dev/null +++ b/8b7178b88b/evaluation/rankeval/8b7178b88b_2_lm-eval_global_step84877_2023-01-30-20-00-12_2shots_backup.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.296, + "acc_stderr": 0.014442734941575018 + }, + "anli_r2": { + "acc": 0.355, + "acc_stderr": 0.01513949154378053 + }, + "anli_r3": { + "acc": 0.3233333333333333, + "acc_stderr": 0.013508372867300222 + }, + "cb": { + "acc": 0.39285714285714285, + "acc_stderr": 0.0658538889806635, + "f1": 0.28226120857699805 + }, + "copa": { + "acc": 0.77, + "acc_stderr": 0.04229525846816506 + }, + "hellaswag": { + "acc": 0.45737900816570404, + "acc_stderr": 0.004971619995879763, + "acc_norm": 0.6022704640509858, + "acc_norm_stderr": 0.004884287515461492 + }, + "rte": { + "acc": 0.47653429602888087, + "acc_stderr": 0.030063300411902652 + }, + "winogrande": { + "acc": 0.5698500394632992, + "acc_stderr": 0.013914685094716692 + }, + "storycloze_2016": { + "acc": 0.6996258685195083, + "acc_stderr": 0.010600915927985021 + }, + "boolq": { + "acc": 0.5724770642201835, + "acc_stderr": 0.008652692997177339 + }, + "arc_easy": { + "acc": 0.6384680134680135, + "acc_stderr": 0.009858506543162063, + "acc_norm": 0.6473063973063973, + "acc_norm_stderr": 0.009804420599378657 + }, + "arc_challenge": { + "acc": 0.3037542662116041, + "acc_stderr": 0.013438909184778755, + "acc_norm": 0.34215017064846415, + "acc_norm_stderr": 0.013864152159177278 + }, + "sciq": { + "acc": 0.923, + "acc_stderr": 0.008434580140240637, + "acc_norm": 0.926, + "acc_norm_stderr": 0.008282064512704159 + }, + "piqa": { + "acc": 0.7442872687704026, + "acc_stderr": 0.010178690109459857, + "acc_norm": 0.7546245919477693, + "acc_norm_stderr": 0.010039831320422386 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/8b7178b88b/evaluation/rankeval/8b7178b88b_3.json b/8b7178b88b/evaluation/rankeval/8b7178b88b_3.json new file mode 100644 index 0000000000000000000000000000000000000000..17f461fadc06ac3b0e0419581413f52110b71138 --- /dev/null +++ b/8b7178b88b/evaluation/rankeval/8b7178b88b_3.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.32, + "acc_stderr": 0.014758652303574883 + }, + "anli_r2": { + "acc": 0.362, + "acc_stderr": 0.0152048409129195 + }, + "anli_r3": { + "acc": 0.32916666666666666, + "acc_stderr": 0.013570806258433625 + }, + "cb": { + "acc": 0.44642857142857145, + "acc_stderr": 0.06703189227942398, + "f1": 0.44163083293518074 + }, + "copa": { + "acc": 0.78, + "acc_stderr": 0.04163331998932261 + }, + "hellaswag": { + "acc": 0.45628360884286, + "acc_stderr": 0.004970672651595845, + "acc_norm": 0.602867954590719, + "acc_norm_stderr": 0.004883037758919965 + }, + "rte": { + "acc": 0.5523465703971119, + "acc_stderr": 0.02993107036293953 + }, + "winogrande": { + "acc": 0.6006314127861089, + "acc_stderr": 0.013764933546717612 + }, + "storycloze_2016": { + "acc": 0.7097808658471406, + "acc_stderr": 0.010495529690730063 + }, + "boolq": { + "acc": 0.5685015290519878, + "acc_stderr": 0.0086625945690273 + }, + "arc_easy": { + "acc": 0.6418350168350169, + "acc_stderr": 0.009838331651451848, + "acc_norm": 0.6452020202020202, + "acc_norm_stderr": 0.009817629113069694 + }, + "arc_challenge": { + "acc": 0.3097269624573379, + "acc_stderr": 0.01351205841523836, + "acc_norm": 0.3378839590443686, + "acc_norm_stderr": 0.013822047922283512 + }, + "sciq": { + "acc": 0.924, + "acc_stderr": 0.008384169266796403, + "acc_norm": 0.933, + "acc_norm_stderr": 0.007910345983177547 + }, + "piqa": { + "acc": 0.7464635473340587, + "acc_stderr": 0.010150090834551791, + "acc_norm": 0.7480957562568009, + "acc_norm_stderr": 0.010128421335088688 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/8b7178b88b/evaluation/rankeval/8b7178b88b_3_lm-eval_global_step84877_2023-01-30-20-00-12_3shots_backup.json b/8b7178b88b/evaluation/rankeval/8b7178b88b_3_lm-eval_global_step84877_2023-01-30-20-00-12_3shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..17f461fadc06ac3b0e0419581413f52110b71138 --- /dev/null +++ b/8b7178b88b/evaluation/rankeval/8b7178b88b_3_lm-eval_global_step84877_2023-01-30-20-00-12_3shots_backup.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.32, + "acc_stderr": 0.014758652303574883 + }, + "anli_r2": { + "acc": 0.362, + "acc_stderr": 0.0152048409129195 + }, + "anli_r3": { + "acc": 0.32916666666666666, + "acc_stderr": 0.013570806258433625 + }, + "cb": { + "acc": 0.44642857142857145, + "acc_stderr": 0.06703189227942398, + "f1": 0.44163083293518074 + }, + "copa": { + "acc": 0.78, + "acc_stderr": 0.04163331998932261 + }, + "hellaswag": { + "acc": 0.45628360884286, + "acc_stderr": 0.004970672651595845, + "acc_norm": 0.602867954590719, + "acc_norm_stderr": 0.004883037758919965 + }, + "rte": { + "acc": 0.5523465703971119, + "acc_stderr": 0.02993107036293953 + }, + "winogrande": { + "acc": 0.6006314127861089, + "acc_stderr": 0.013764933546717612 + }, + "storycloze_2016": { + "acc": 0.7097808658471406, + "acc_stderr": 0.010495529690730063 + }, + "boolq": { + "acc": 0.5685015290519878, + "acc_stderr": 0.0086625945690273 + }, + "arc_easy": { + "acc": 0.6418350168350169, + "acc_stderr": 0.009838331651451848, + "acc_norm": 0.6452020202020202, + "acc_norm_stderr": 0.009817629113069694 + }, + "arc_challenge": { + "acc": 0.3097269624573379, + "acc_stderr": 0.01351205841523836, + "acc_norm": 0.3378839590443686, + "acc_norm_stderr": 0.013822047922283512 + }, + "sciq": { + "acc": 0.924, + "acc_stderr": 0.008384169266796403, + "acc_norm": 0.933, + "acc_norm_stderr": 0.007910345983177547 + }, + "piqa": { + "acc": 0.7464635473340587, + "acc_stderr": 0.010150090834551791, + "acc_norm": 0.7480957562568009, + "acc_norm_stderr": 0.010128421335088688 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/8b7178b88b/evaluation/rankeval/8b7178b88b_4.json b/8b7178b88b/evaluation/rankeval/8b7178b88b_4.json new file mode 100644 index 0000000000000000000000000000000000000000..589aa34adcc866d07d332cf6a596550a61315b3f --- /dev/null +++ b/8b7178b88b/evaluation/rankeval/8b7178b88b_4.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.328, + "acc_stderr": 0.014853842487270336 + }, + "anli_r2": { + "acc": 0.38, + "acc_stderr": 0.015356947477797577 + }, + "anli_r3": { + "acc": 0.3575, + "acc_stderr": 0.013840921245257796 + }, + "cb": { + "acc": 0.48214285714285715, + "acc_stderr": 0.0673769750864465, + "f1": 0.3799029799029799 + }, + "copa": { + "acc": 0.77, + "acc_stderr": 0.04229525846816506 + }, + "hellaswag": { + "acc": 0.4539932284405497, + "acc_stderr": 0.00496861353930925, + "acc_norm": 0.6053574985062736, + "acc_norm_stderr": 0.004877748536428436 + }, + "rte": { + "acc": 0.5018050541516246, + "acc_stderr": 0.030096267148976626 + }, + "winogrande": { + "acc": 0.5832675611681136, + "acc_stderr": 0.013856250072796318 + }, + "storycloze_2016": { + "acc": 0.7204703367183325, + "acc_stderr": 0.010377702099704856 + }, + "boolq": { + "acc": 0.5596330275229358, + "acc_stderr": 0.008682635667686902 + }, + "arc_easy": { + "acc": 0.6456228956228957, + "acc_stderr": 0.009815004030251743, + "acc_norm": 0.6435185185185185, + "acc_norm_stderr": 0.009828046544504438 + }, + "arc_challenge": { + "acc": 0.2986348122866894, + "acc_stderr": 0.013374078615068756, + "acc_norm": 0.3216723549488055, + "acc_norm_stderr": 0.013650488084494162 + }, + "sciq": { + "acc": 0.921, + "acc_stderr": 0.008534156773333431, + "acc_norm": 0.938, + "acc_norm_stderr": 0.007629823996280307 + }, + "piqa": { + "acc": 0.7464635473340587, + "acc_stderr": 0.010150090834551782, + "acc_norm": 0.7529923830250272, + "acc_norm_stderr": 0.010062268140772644 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/8b7178b88b/evaluation/rankeval/8b7178b88b_4_lm-eval_global_step84877_2023-01-30-20-00-12_4shots_backup.json b/8b7178b88b/evaluation/rankeval/8b7178b88b_4_lm-eval_global_step84877_2023-01-30-20-00-12_4shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..589aa34adcc866d07d332cf6a596550a61315b3f --- /dev/null +++ b/8b7178b88b/evaluation/rankeval/8b7178b88b_4_lm-eval_global_step84877_2023-01-30-20-00-12_4shots_backup.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.328, + "acc_stderr": 0.014853842487270336 + }, + "anli_r2": { + "acc": 0.38, + "acc_stderr": 0.015356947477797577 + }, + "anli_r3": { + "acc": 0.3575, + "acc_stderr": 0.013840921245257796 + }, + "cb": { + "acc": 0.48214285714285715, + "acc_stderr": 0.0673769750864465, + "f1": 0.3799029799029799 + }, + "copa": { + "acc": 0.77, + "acc_stderr": 0.04229525846816506 + }, + "hellaswag": { + "acc": 0.4539932284405497, + "acc_stderr": 0.00496861353930925, + "acc_norm": 0.6053574985062736, + "acc_norm_stderr": 0.004877748536428436 + }, + "rte": { + "acc": 0.5018050541516246, + "acc_stderr": 0.030096267148976626 + }, + "winogrande": { + "acc": 0.5832675611681136, + "acc_stderr": 0.013856250072796318 + }, + "storycloze_2016": { + "acc": 0.7204703367183325, + "acc_stderr": 0.010377702099704856 + }, + "boolq": { + "acc": 0.5596330275229358, + "acc_stderr": 0.008682635667686902 + }, + "arc_easy": { + "acc": 0.6456228956228957, + "acc_stderr": 0.009815004030251743, + "acc_norm": 0.6435185185185185, + "acc_norm_stderr": 0.009828046544504438 + }, + "arc_challenge": { + "acc": 0.2986348122866894, + "acc_stderr": 0.013374078615068756, + "acc_norm": 0.3216723549488055, + "acc_norm_stderr": 0.013650488084494162 + }, + "sciq": { + "acc": 0.921, + "acc_stderr": 0.008534156773333431, + "acc_norm": 0.938, + "acc_norm_stderr": 0.007629823996280307 + }, + "piqa": { + "acc": 0.7464635473340587, + "acc_stderr": 0.010150090834551782, + "acc_norm": 0.7529923830250272, + "acc_norm_stderr": 0.010062268140772644 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/8b7178b88b/evaluation/rankeval/8b7178b88b_5.json b/8b7178b88b/evaluation/rankeval/8b7178b88b_5.json new file mode 100644 index 0000000000000000000000000000000000000000..8ee23e94a66094ed3b883e19004080a59f7bea69 --- /dev/null +++ b/8b7178b88b/evaluation/rankeval/8b7178b88b_5.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.32, + "acc_stderr": 0.014758652303574869 + }, + "anli_r2": { + "acc": 0.341, + "acc_stderr": 0.014998131348402706 + }, + "anli_r3": { + "acc": 0.32166666666666666, + "acc_stderr": 0.013490095282989521 + }, + "cb": { + "acc": 0.39285714285714285, + "acc_stderr": 0.0658538889806635, + "f1": 0.36734693877551017 + }, + "copa": { + "acc": 0.76, + "acc_stderr": 0.04292346959909283 + }, + "hellaswag": { + "acc": 0.4540928101971719, + "acc_stderr": 0.004968705270086761, + "acc_norm": 0.6073491336387173, + "acc_norm_stderr": 0.004873421833291568 + }, + "rte": { + "acc": 0.5306859205776173, + "acc_stderr": 0.03003973059219781 + }, + "winogrande": { + "acc": 0.5864246250986582, + "acc_stderr": 0.013840971763195308 + }, + "storycloze_2016": { + "acc": 0.7172634954569749, + "acc_stderr": 0.01041380648612127 + }, + "boolq": { + "acc": 0.5626911314984709, + "acc_stderr": 0.008676043429497423 + }, + "arc_easy": { + "acc": 0.6388888888888888, + "acc_stderr": 0.00985601342581124, + "acc_norm": 0.6506734006734006, + "acc_norm_stderr": 0.009782853449399295 + }, + "arc_challenge": { + "acc": 0.30887372013651876, + "acc_stderr": 0.013501770929344003, + "acc_norm": 0.3395904436860068, + "acc_norm_stderr": 0.013839039762820164 + }, + "sciq": { + "acc": 0.921, + "acc_stderr": 0.008534156773333438, + "acc_norm": 0.933, + "acc_norm_stderr": 0.007910345983177547 + }, + "piqa": { + "acc": 0.7464635473340587, + "acc_stderr": 0.010150090834551786, + "acc_norm": 0.7524483133841132, + "acc_norm_stderr": 0.010069703966857116 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/8b7178b88b/evaluation/rankeval/8b7178b88b_5_lm-eval_global_step84877_2023-01-30-20-00-12_5shots_backup.json b/8b7178b88b/evaluation/rankeval/8b7178b88b_5_lm-eval_global_step84877_2023-01-30-20-00-12_5shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..8ee23e94a66094ed3b883e19004080a59f7bea69 --- /dev/null +++ b/8b7178b88b/evaluation/rankeval/8b7178b88b_5_lm-eval_global_step84877_2023-01-30-20-00-12_5shots_backup.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.32, + "acc_stderr": 0.014758652303574869 + }, + "anli_r2": { + "acc": 0.341, + "acc_stderr": 0.014998131348402706 + }, + "anli_r3": { + "acc": 0.32166666666666666, + "acc_stderr": 0.013490095282989521 + }, + "cb": { + "acc": 0.39285714285714285, + "acc_stderr": 0.0658538889806635, + "f1": 0.36734693877551017 + }, + "copa": { + "acc": 0.76, + "acc_stderr": 0.04292346959909283 + }, + "hellaswag": { + "acc": 0.4540928101971719, + "acc_stderr": 0.004968705270086761, + "acc_norm": 0.6073491336387173, + "acc_norm_stderr": 0.004873421833291568 + }, + "rte": { + "acc": 0.5306859205776173, + "acc_stderr": 0.03003973059219781 + }, + "winogrande": { + "acc": 0.5864246250986582, + "acc_stderr": 0.013840971763195308 + }, + "storycloze_2016": { + "acc": 0.7172634954569749, + "acc_stderr": 0.01041380648612127 + }, + "boolq": { + "acc": 0.5626911314984709, + "acc_stderr": 0.008676043429497423 + }, + "arc_easy": { + "acc": 0.6388888888888888, + "acc_stderr": 0.00985601342581124, + "acc_norm": 0.6506734006734006, + "acc_norm_stderr": 0.009782853449399295 + }, + "arc_challenge": { + "acc": 0.30887372013651876, + "acc_stderr": 0.013501770929344003, + "acc_norm": 0.3395904436860068, + "acc_norm_stderr": 0.013839039762820164 + }, + "sciq": { + "acc": 0.921, + "acc_stderr": 0.008534156773333438, + "acc_norm": 0.933, + "acc_norm_stderr": 0.007910345983177547 + }, + "piqa": { + "acc": 0.7464635473340587, + "acc_stderr": 0.010150090834551786, + "acc_norm": 0.7524483133841132, + "acc_norm_stderr": 0.010069703966857116 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..10683c70a1ba9cf393a25ef2d1c6d113f0ccc7b4 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de13bd47afbfcc575add31887fdb9757f1fbadfeeb45c541c024e716cda9f147 +size 208731415 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..41efb0e8c8203e16e182906e32d75213c968b82c --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04062199ad8fc14a5711aa1e60a4436e6db28d7516a1a9f2951b2cfe4f45644 +size 208731415 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_0_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_0_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6cf196d0d5c746c847e011f7b4008e1a27a67915 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_0_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c40bdc748d8ba4811102fce9aa956b2da751d8cad367d3dd5990877cc31bc62 +size 208732183 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_0_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_0_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b108c60e3d80f2dbfe745c98b4d601701732823b --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_0_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b08d376fb85ef9ed35d663719fc3bb75eefb256adf4af6ee88ffaf862e36813 +size 208732183 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e05b389b4401841bc0bf4fcc8ea1d379aa8c8d3 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6059f4fa1de7f0d2109cdbfb7c2f1bae3862665d4ca17d921b843ead41a6d75 +size 208731437 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d3cecf3d2dfff0be4b8beac58935b9cef127d755 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ba154bb2e5195ffb46d24c7afcf9195da6bcf1b3b50667862cd5acb9333e57a +size 208731437 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_100_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_100_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4c8b1f29df85e3aebb376d08506d7e968ae62473 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_100_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:227c55d85e0af7407f05812f7c6d6cca3851c449b58fea2608eac059b9f22478 +size 208732269 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_100_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_100_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..daa41213fc0fbf319ee017109293c64cdab5383b --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_100_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c9c29e3dfb1b0c12ef80dca85ad9c62cd621d3ae9815ee8783dc9c2e99ac7bb7 +size 208732269 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..973af7adab8748190454628aba883633595fd2c0 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c4909064133d6d5e920ee6a591e5fceb7d83aaa0aabef528a31116ce24513fd3 +size 208731437 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c39ff057a1b0deec1b3fe22c0371bca31bfb6298 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d6befa06a3430a1a47d3bb9e240d4c360146dd2444b6e25fb0ccc781517ba69 +size 208731437 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_101_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_101_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..731ab0658fa0a30f12f1b42d459937947559b509 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_101_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:26858cac87bc60816854aac5cf142feefa4a0de05189a8d23f5ff8d3bda1ab2b +size 208732077 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_101_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_101_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e5770529503546a66e7eb23de71b089df45e9320 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_101_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:82f9e4b93bb275645d776e6894cbf18282593ba566d9e9385c6a63fbd56bc651 +size 208732077 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..643f791300582193260f2f9b2a1c0ad3d1e2211f --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d309d59707221a7e7c4cef65bbed983cee2a293ab10e72d616108d3b5ab955f +size 208731437 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c617615a223311132d15bd5247e6d85993f6eb02 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c0adcd262842e38a5a5d8898940236383d93be3364d6a17b29e2a9c8a7ac784 +size 208731437 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_102_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_102_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c6ef50c902befb90c504a8eecc89d0d6c82ce54a --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_102_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c24218742bf38e857c6f758c6fb50f384f6f5e52dfa7a1cf0d998a89c81c5efc +size 208732205 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_102_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_102_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..edd9a3916b3b9edfcc5cc4b699747dd1b3cd94e1 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_102_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:79ec2299889bd50c78432f7d051ad2c7cd6c0c79d5b67687e9a8b1ff842eda48 +size 208732205 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..00aac7de0bbfeaf63a300ec6eb80e600192ca677 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd37b70e280eb66709536deaf91e4558639fc4be5a67afe2ee2cd817c0f3a791 +size 208731373 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..38639dbf34f644860b53dac732d2d8021b365097 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ef71e57483af8f05deedc1c648129f238c3831ebaaf2430ce5198b0421a6516 +size 208731373 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_103_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_103_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c5ac7c5a1e53edd7758ef847b8b145165835e4cb --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_103_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b98cbbc9c2464756d5b7bbdfb3abb496345e50f89685a5048c7dbf7a18e9f35 +size 208732205 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_103_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_103_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c2f43400ccafd5729f4c78be21d324873367bedf --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_103_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f5e277415513656d68e1f44741ca7a585d40ac13aeeb3b8009b3ade012ba7a42 +size 208732205 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bda625cec08b8b76f5a607b237f9a6ecf44d9c8a --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02e8775b39377db26f3ef0252a1bb2a8a288ec1f6a56c6ed1478b1503a82f400 +size 208731501 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9ffea7cd984655d99d7f56202b755fd3f5ac98f6 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc2e3e35b1cbc0744141e97901c095de9a9647af9f042b917e810af7cda70364 +size 208731501 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_104_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_104_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ccbf7fcebda49ed5df3559dcbfdeea0a475941c8 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_104_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a90227ba6f8bff01b95b62767d2ae3ef6367241fb390d533563163c7d916c6c3 +size 208732205 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_104_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_104_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dc58a77e86f8f69c52a6f9c6b56fac1d77495352 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_104_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5078830b91bf242d99e2e1a33053909c37efb07ca7d5a2ea83ec9c01a4ba1614 +size 208732205 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cb00e5fbeb5948f7c1915eb54768148daec5cfe0 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad4993506bf7b8a976bed93f0c57f1b9e1556c51c93da19ca40b39ec2173a5d3 +size 208731437 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2deebb03639a7813d6257ef134370b75bbcb1108 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02817d495204ca6b91c5ea0220b3aa8c73ba54a762c632521512e37ed48548fe +size 208731437 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_105_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_105_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..447032d062b2a23809bdcef2decd26a3a5cd6662 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_105_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f374d114e52a4b9a2b4657afbee2a128de949e7723815837672c10bc5dd5f51 +size 208732205 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_105_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_105_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b1ef55b2316a5f8acae9134bd2b2a81f33f7c94f --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_105_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8808a5f71dc8bba7f7094e2d00d216f901b8d0a4e2e2f7e809ed294a2891dcdc +size 208732205 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..084facb1fe748192aa78ba001a5e415087a38815 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d21e8e9beb1315ff65b30eb6632a3a939ee71dab9f64848aa3cdcaaba469d25 +size 208731437 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c897662f5ece13c9989556ddedeef5b269ed2caa --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a909742f8a3cd9592d1bb460b27735863123c2a01828a9acbc7df669039beaf9 +size 208731437 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_106_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_106_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0c3704a0c8cf010823ae6d1a83357d0a3b6231be --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_106_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad54e3c30f25108c852ebd799965f61d2e8a1c86299fcf17f5748505aafffd15 +size 208732269 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_106_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_106_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..be3b8478722ffeb01f64951a2dc380dd823001b2 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_106_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f4a4c68cbfa7bcb8a6dffa1f1d950b64bf3ca6619f3e1e4bd0e90eb5e6c2d9b +size 208732269 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2a74d2755369a80ffb11664e26c8d7a966f42e16 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f1e032950565e6e3d5b7b16a28cff05acd7e790bd0dd4029c8d031125a63977a +size 208731501 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4d6e3ae058064929fd6710d92f7a027e6f46b8fe --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df5bd6d1be8833efc1ce498e06585ad6e6832464f0c1240a0a4d4f5a0ece459d +size 208731501 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_107_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_107_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..991fc8dc8d6550edf4037bafc80894c18f4f32b3 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_107_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7767eda68bcae1644bf49d3eebbc1528f533290fb645e554a5c55dc34c3ae80d +size 208732205 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_107_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_107_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..637ab62873a8cca39fbd0c56d773ac50f2f46c64 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_107_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a7b16097860a203b7d0058038bb8d655cbf97cb9b6704553702848d6d150ff2a +size 208732205 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..13a97c3fee09208b0ac72f7ff33cc2456b248442 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d6964caaec9b7b4dd01893cfad335507902c15c94e4121f6c3016e39649ba3c0 +size 208731373 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a61a6ee1e55002db3f6c201d753ce51e3f7675a9 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d5e9f6b2b6ec3bf039214813a6e76997fafab24cfe34873971b0619ff11ba0b3 +size 208731373 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_108_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_108_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e9af324614e82c437a61da1c6c88cc557ffce576 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_108_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f68ade7b87d4c06eb802e679fc123e2f11432fa3581b5c719e8968dc2dab774 +size 208732141 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_108_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_108_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1d857bd0ce97fd4c55bed2c470f219c30f2e8edc --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_108_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d04c0db2f0e7f20498a561b31f5cc93f3243603cf27e05f376733601b8537d9f +size 208732141 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..24d60647c7ebfe8b9bc1ee727cc95bfecb35c789 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf74dafb5c41c08ac9cdcc8c877f99162e8ac73b878d7e0bc01af28e322cbd1b +size 208731373 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f82b8d86b36ecdb16fde1e9140363bc4f285eefa --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:956d7be7223747789e080aae3a3bea74cba8e3629e783e6b3e8f155e188a5c0b +size 208731373 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_109_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_109_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..396fb7f9147a8fd49bc980cb2a099d46a2aa2e94 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_109_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c381f95d0c622b9b4767db8ffdaaf8f2c9cc11ef39d68cdfa60a22d6c9d3a8e7 +size 208732141 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_109_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_109_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7150afd9dee39556c3bbc04ed44aaaf4ec49d188 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_109_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1292d285e3e388bb495cc57157254d7926448bd6c5ce1e4003c6e3aad9ab0b32 +size 208732141 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3fadbe43c7cf8c0634daf3f81801e117f016f168 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:599885f0f2a832c2cb4764ebded4e3f694063f71f1e680760f768533d2cf2150 +size 208731362 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c74ff0b78dc3bd4fd6006db65ff216a913fdaa1d --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:52f7a17c0c6ee83afd0f156cdbc83bd8a633937fce1b64c39decfbee9edd7052 +size 208731362 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_10_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_10_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..30398d78c0fd9723ec909f485ca4cee974188e39 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_10_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b0d63bdf9260a4f78e59432708e38803b9749706a068a760a81ffc73a02466c8 +size 208732130 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_10_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_10_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a78452fddca27a56e6b8ddd40b4cf6caadb7e8b8 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_10_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:16385994a6667deef13fe2a22a32d2d96b56b66c88ab6d2782b35c6243067947 +size 208732130 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2ee3af385e4e25989d8e104728e757a1f3de323d --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c22c22a33888b0244bf00c9bca68cbaf937d3d426e63c47eb0fb4effa453d465 +size 208731437 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c103c055b3e3a52640e74a2524e02d6db7e3a3b0 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ffab867ed81c480838072121856cea71ab10cf26a0143b89531b6f359522afbf +size 208731437 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_110_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_110_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..91ed72860b8d68593be756910a50b158eb5000c9 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_110_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c419bf4caf3cd799296d8f739fc26b68248ce22ac0b7cc59edddeea57eabb444 +size 208732205 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_110_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_110_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f013d588e5c5d4f933415bd9e3a13199d79027f5 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_110_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c355097e2135ef5eedef5f9ba3214c3f72a8796b923eb6f919f7ed6a372e7fd +size 208732205 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f387d7d15138b98d56b6fc48362853f8121712e4 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:850d1fb02168798c3523bb7d95d9e15052aa37862e114d17206ebb81ea60b070 +size 208731373 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a9e95836305a23401ba2f6e97cd9ea9abd3fa5ca --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:11d87f5f72ae5ff3aa9042b2e4b01ca288a9e052b3484f9078031ebf5c720c16 +size 208731373 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_111_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_111_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3e035ba0688a6028299e2f5e76633d216d23bdea --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_111_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f55ca4769eb8d24a6613849cf6909db11726d37bbc4e0bc7d2e7e70aa9668be6 +size 208732141 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_111_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_111_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9df76c3b60f8bab507ce7ce503f188dd53c8b814 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_111_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3487c9acb2b716162567de2a5246b8fedf502000613b621876dd665779da814c +size 208732141 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..952ded84697051d3dab75efc6e891acd20e72500 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d546b6c3f48a893618d1e1a55becf6a1f9387730f163a5dd5759725633547c8 +size 208731437 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..732d2bd6582264244042e60b4a2012e9054ed75e --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb8a538f5137d87ac509e00b6cc47acf90989da5fed1caef5973b9ca5e95f831 +size 208731437 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_112_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_112_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..62dc0b8b24db9667fc8fbe77901b95467528ac4f --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_112_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d99082d0c166226e67e06c4c213649d909938c0069e2e3bbf9e5bbca248edb1 +size 208732269 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_112_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_112_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c6e3ccbdf6b8f55cd17d27e99914b74ee2a5787e --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_112_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:033f76e153b5b7fb54fa17a6d37c92d521c36ee5ebcc8b3af13ab1210289c96c +size 208732269 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..86264c921afb1e5b7da522df6bdce8aaced307e5 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:30eea1f70ba83e4b2ba26ae3f980cab350ccfd8bf683e0e33e90ceb3892757f7 +size 208731501 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..aac18841e496984e50b48b74709b18bd91d7f99d --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:57afd5e733e329e4de62f8382b5cce0080d9d46f8cd158df9e69f5b2dd73a0a4 +size 208731501 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_113_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_113_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1d545d0ecf310a0c221e78bbeea45ed0158ce195 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_113_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3eb7efcb36861a637ef131935b296968ac2d89f52c9faf20afe71320672895cb +size 208732141 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_113_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_113_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..35c06d503f8520e828a5ddf1c3809249f9d5e056 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_113_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:896158ad9868830e441321afe4709e9b0feed0c05a1a4730c3a6b0dce6564dc4 +size 208732141 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1e758d06810facbf9cfd6980d8c3dbc031922e2a --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd5103c9fb55634743ba695176f5e9d3e65673095e7a7f83db2a91be6240b058 +size 208731309 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..77ef54ae83a7f2e71eb617a46f91bfc4f7b5cfde --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b89242994b989e8769b632d10aa9ea852186adb6c9e1124e9ff180f5ce404d8a +size 208731309 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_114_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_114_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a6bf8e223261c4e4ead90ffc7c8fc4c041a1cb73 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_114_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f5703d6baee9dd2710f715ecc32abc47cf1869bd393003ce15628a97afad8df6 +size 208732141 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_114_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_114_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1c6d33475acdc37f808245edc87c9261ef40cce4 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_114_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d7c3790e1180bb33f25ce2b72a8006bbe0f6bdd6401f91be02c8d67e9bc1174 +size 208732141 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..546e5ef16e540f5b009848d078d3e282950af37e --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a0930db4442dc3d9e64a900a94d532d25abc4ad04e8f343812f4aaca4375891b +size 208731437 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a8e6190e6aaabeed762b5051123df8d3d87f227a --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa554e0c762cd3feada7d6c9647251026aedabf588146632e1efac82f9c27f7a +size 208731437 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_115_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_115_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2e9a4da591aaefdac146808fb36a43e462eb8054 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_115_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d19ae77ee0873b1d46903161437b39e5772da4854b74717fc7b325dca4a952ed +size 208732205 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_115_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_115_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cbcecce32a1830854fbe1b611274d529fb925d8f --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_115_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:063e390a41043ba0a3184fafde434238427869411962ad9b3d1b678b0d95213d +size 208732205 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..00284bb325991fc88be8463560bfd39f220323a8 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:675fec8ffdf689615bb9beb79eb47c8db1246ac8acea1994531b9364770e455a +size 208731501 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e923eb79b15cd7e1846e838c71bf1803a7e42b24 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:faf4de40c30e92da54cd032e9ed04888ba44c4d73dafbbf64d809d2f1753b9b6 +size 208731501 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_116_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_116_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5707d03cd7ea5e5034b17b81df0dc67d17dcfcc7 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_116_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8b7a3d025312bb37e8e4330f1f0e2876663a0738e1fc0a75379a380aed186a2 +size 208732269 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_116_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_116_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6d5b8fadb32c7611a5e78b3a7e5923b2fc6d2a93 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_116_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:859a81b3c3836416b3768f431c14d8250d7b0fe981769b6f4c190aeaf3e676e7 +size 208732269 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4027f200f51ff14cd3c67f803857b098f8cdf32f --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:89651d42ae79b52f8f061c6b7dfb60f5114e29dca0f2690c1007915b8798ce4a +size 208731437 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..060e52916097393fec57d258918cfd9857ea3809 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd6ee4502c101552ab30c9ee86f962dc28766c780efd5009beeca06d47ca9667 +size 208731437 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_117_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_117_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0adc565d3ab41abd064d3d1d4dc8bfedb9471409 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_117_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:872eb307b8d28ca0ed7b0cd34493fbceaf903d79942541fd0cc3a9f4bc49d049 +size 208732205 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_117_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_117_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1ca4a73d204c57671bcddaf490c5e7276a93d0b9 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_117_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3072ac4f3849798196f037f034688033759d6f699113938dc296991e1d6b58fb +size 208732205 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..49fb06a9d3c8a332dcfb80660006a449bf151bc8 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dcb48f4429dfe90ee9bcae8c84f4d08e0ee8f68d6b5baae1ce563c8f3577683f +size 208731437 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a611996fb15fda0819bc10f32f1ee307ac293728 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:43b16352a8ab29a4e3f16112ebfa31146faf913709cea6fc10377996c77299ca +size 208731437 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_118_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_118_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e55a56c173167c7acaff2182c2caddff98a567b7 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_118_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:49d85a5bbce7579f0a0221324d0207a3d112b7bddb6a4cac0693c142d59bb19a +size 208732205 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_118_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_118_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..127cb4e0eb39c33703cd671e8991b679d7da0a40 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_118_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd822293e497ca069156df160470ef082fa2cce861c71d89719d6ac5f3b4c45f +size 208732205 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2a6fff46530cdcacfb60fb1a00b06e3729811ee5 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb7de6a57e42cb7e37e4201027ee5766f7214696e8f1a92406530576541f0c00 +size 208731501 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fe42a92676092847f172c9e7ffa67ee732b9c350 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2869dc83c7a875a496d8a0e9779ba32ddba12757ce1652913cbf80642451db5 +size 208731501 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_119_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_119_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2de6c5bda793f968cc60c8e8aedf3e041eea5deb --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_119_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1072329b7df58623dd75478026cdf17b9e3599ce3c81fccab252f7aa8c601a80 +size 208732141 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_119_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_119_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..eff47b08130fdb5821bf077488777e7f6dcf4988 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_119_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd4fac21cede0cf590347440d606f88e847d5dc479ab673cbdb75b86e8f324c3 +size 208732141 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..35f8f4e9f2a77ab7f7c0d60fe52793679356ef37 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:164598f65b842aec01248d331362e9229ca1afb9d311906df4f0f1954ef60b5a +size 208731490 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a395fde7329394389ff3075d6f7257f09806f97a --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84d9c8cbfd62bc41c1f10c2649500899e9610d73e08b6f9eed7423bc124ef214 +size 208731490 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_11_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_11_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3ce53c37aee83c7908cee84abb36a9022a5ee241 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_11_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa5b638175b5e6e4b775723a0aabf775529c132ee1d16ad78e7edd4fb5ca223e +size 208732258 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_11_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_11_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ae7fb86c19574753ccabc2e19918b49d54688396 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_11_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d35768e2dfd551737f51e4666d266b7d0f2f09929979a1eecebfd091bf6b2ef6 +size 208732258 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..006804fe9616e38510230f8c0e2fc0c204212882 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d7774ad63eefc6b3a7efd29a281596c8f1b2bf2050b5051a23357141eb83ff0 +size 208731373 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..75ee681e4496ffb99f80789685010daf52c936a0 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:351e5e7eba29afe9f8e5198ee48836b4220ed1507fa079075936a09598e2391c +size 208731373 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_120_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_120_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6d7ebffd706c00e182fb7d42af643fc5a66d7e44 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_120_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1d128cda3e1772a61f2f70942b9613328998167b20e1b6c46132b2eb6a7c184 +size 208732205 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_120_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_120_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a4148922985bade2d36f5d6db30cf03206bb60ae --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_120_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:54cfcbd267faa8dcc8f7f5c678f977992cc811501ed37411bf17f70b2de7b135 +size 208732205 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..09f54845441d5edb43dfcd15634bef0741e281bb --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf6021e34c043efd71ce80080d542efca6d4d4a1b85b59a4583ad894852be213 +size 208731437 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..379d7e8df776cfef47234110a4daf3624e4e3ede --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b7e60350bbbee021e267d1e282627d33f7c60489fc7db799b561e98b0889adac +size 208731437 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_121_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_121_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cca241ed71a5418e97c779af0265793d18a37070 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_121_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c19b86c92a1ca02ccd88969703429b28f04853906cf9bfc0bfd7c14d8ae3f29c +size 208732205 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_121_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_121_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1855232067d8d1d0c5d1e09bf2ebc0e7340058c4 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_121_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10b2d3227fc56c6be2eb0364d9e56c17c24cf144e48bddfc5a84c0497b5d0d13 +size 208732205 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7b0231411665390faa119124d056f06ca93a4c18 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:99d2f9bf11dc8bbe3c7c705a858550a6d0310cbc0c1e7935f98346abdd78038a +size 208731309 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..40a04a6bd9e9c37ced2388dd4feaf4017719a5d9 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a665ba5076dc4ec45739fd0d75c483da02e1feb6bf5b7b18a1d3b7168a1042a +size 208731309 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_122_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_122_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..162e97b1e3e98e873988c7365d3a3cb9cabb70b8 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_122_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73e907037cc65d62b6f69b4c63d32007cf4cdcd4d5a5a8f91542620c441042dc +size 208732141 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_122_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_122_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d109a18bca9e6a02184673c7652787e5efc4a622 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_122_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:14a4467e0ae95e612eb4952c3d8adc6526094e59b12adec74be5bdcd5084d531 +size 208732141 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ca51bacaf7082b94650e1cc90964c9e8c4d653f2 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5893cc7f59636700eb6036b38c194ef15aaa897d1bfb40adb96e38b9b37c0200 +size 208731373 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..aa36bc73ed6a85dc35f026406a44b0350359d88e --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b311478cc772db362991b62742d8c1eeefd40fb7618c7922332f727d7bfa22a +size 208731373 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_123_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_123_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9393d23bb2d4f2b1d926c21b7902c46061da292e --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_123_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0169b2e236ec64a621c4ca6210c5e4537f7e685415a9f0d51e343462d833e315 +size 208732141 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_123_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_123_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b0108542bda7596fe6ae10e3dd299700c0b6a7fe --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_123_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77914dadda58c4dc187b4506dd3bca34f05124907e371d2dc8b25481a5b6d540 +size 208732141 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a0269d2fb47b878a70f81181034ad14481e008b0 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e5c8d54ecb5bc5a83adf4ef8a8d607b8a1095dbc91746d2111c0e1084b741209 +size 208731501 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8e9d375cb25dba00d428d62260442f8d8bff2637 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af6eb0975f9704f38a64fb82ecf9e8aa979012ed7d92b91639fbcd96eb8bf161 +size 208731501 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_124_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_124_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d1e663ff26678599f32160d0d54691f6f9444c7e --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_124_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:986da8129aa6157c4e09a2d443423f55dfda503bf6ed6a9fb389c8afc13554a8 +size 208732269 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_124_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_124_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..69249aae41c16657831aeeab800cfe496933fc2e --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_124_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:63d68f5a298f10cd91cad9d7fea9bdb3fe43951985bcb379d2d6d9682492d572 +size 208732269 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a1d681d203bae07e3d0fe4b9d3e933a6db19035a --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:96d5f0dcc77bf741d64d989de97517641ee7f124cef345a838cb0f0fcc11ef8e +size 208731437 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5454a60b86e75896e5c4adffa57ac0c3e779d119 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e6bfa66b03b0923cdc47cffcc845ae9f108e10aae1b5800f9427b965f7bffc0 +size 208731437 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_125_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_125_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5cd6f91cc8f3cad3ad23ded95108ec8495be0798 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_125_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a940d23865dbe70b647ac6e64d0d2d14c64bdbd96697c4b1835316c3ab166203 +size 208732141 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_125_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_125_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a4566c7029119b2993f5881ebc8850d64fe0c3e4 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_125_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f9c18caa405b3e52c8bf6bd9c3d655ec0aaaca227516ad81c1fb02a90657906 +size 208732141 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bf96f51548e3c0b4cbd54b150409b84e8c099807 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b342c53a4c98470be2f4468abb96417257777b2ffd72c6cff17bc7c73ffcada4 +size 208731373 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..650f91f8f48af4c3923a1571a1c2101cf4fb6789 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:152b6678b31e4aa7bee86ef7c34125fdad78eb39998220e22cc36d367857d8ee +size 208731373 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_126_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_126_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..99ab2b433156d37f531aa84be6bee68da14718f2 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_126_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:671e523617a6af4ed8cc249ce8190b35c34ff15b3485d74879e68dfac1f604c2 +size 208732141 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_126_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_126_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..30dbf08cb36259b2221759530a687b0c164f9851 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_126_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0715ef680e3b76851ea2899739210ceb25c52f5c5165a42d05242177c7312464 +size 208732141 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2e76a926b2348be6659afd7c620d810fd5ee959f --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f9d974b39622a0af30c81239d948e7fa1e3b87ed4439f606add742deea11564 +size 208731373 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5f612f2247ed4a8928c2e4f427c6ddce0edb48a2 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:448ada3e18f691e1c8725fbdc931fee583e25186eb63ee2eede96026d4ca8cdc +size 208731373 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_127_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_127_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fce0cac20793ef2f064f2a8e8ee7056910cb3a0e --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_127_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d8414a2752ce01f1d933e829278e423ab9cb930372eb90e7bb5f05223f015fea +size 208732077 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_127_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_127_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0da8df9feeb4ed2eb405d302c5a9c2735918bc2c --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_127_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f5038047d27915682406f38d2cf6b1e551d3a7df18f7d5c0a7cba5e375a21223 +size 208732077 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d318203bdaf98815c24884a5c03b7d4f611d8701 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:121faa790ff38e46194bd68a979aaf5ed1843ca5305d7f6f09e6b0d52e212c93 +size 208731554 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..03db0408200e4072935f53b038ff8cf39c02dcbd --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7bbe21737e7191db65a86fdc7d5ccca4a67988028e2ea82f754307c6121fd3dd +size 208731554 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_12_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_12_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0fc2b98ebe08696ee632d3b65f760e9c9fb69206 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_12_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b392597b644293ab101c4f2ab36848c14c14b01592f3b4804164cdbde78f8d39 +size 208732322 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_12_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_12_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..384823375d46c219cf3f9e23b685b26235b4da2f --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_12_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b7812f0b5a6e7dd4d637afc68ca457f16c9bd7b7be218d2ec4e56ea45ec2330e +size 208732322 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9c14c106d8065316711cb39f3778cfc716a63c38 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b5b20dad73ec73597dcdedbafdfeaaafb013dfaed5b0923613f86f3d884b9f9 +size 208731362 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b4cd27e5ed878e4c4b884a57b1573517a4ce928d --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:846165d4b040d56ebadd70a32ffdca8f47e99b4e09cfaa25ce62bda308893a0d +size 208731362 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_13_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_13_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..236e33493f137a882b6c61384d0331e2439ff928 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_13_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d071117435e6f242bccac627a9c8f85243a0146388c0c7d947f25389110acbe2 +size 208732130 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_13_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_13_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0089db88c7f8ebee3b051b3f19459b45b7910a1d --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_13_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a5e4dfb7f241b4358dbbed69b79903e3d95f6f88444fd3d08a67c1cf0f74fe4 +size 208732130 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3459b220bcc1772b4414ef6ef4dc786a231f0339 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:449d2856e0d16d38133009b34921b5c830b984c4441d2a38b3171073fb0260ba +size 208731362 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a120655b6b73db0dd20f4588c5e4b19d29b1d200 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:01f8f590f1a165eafa246aca40b5a97cc7e57bd03526383ee2b2b3c43d71aca4 +size 208731362 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_14_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_14_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f04f6a4768597a5b5ab226684c41881d12ffe3ca --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_14_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d76e74f84be452dc9a43f91c13ee45b5d53a2cb0110e117a48a8c3c620aa5aa +size 208732194 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_14_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_14_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..40c84c0d1e6c9e40da7c1bd8c39f4b917847de79 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_14_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e3852221adb709985894cdb593f06c6cbe53bbf249214c390595407f1d89202 +size 208732194 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c7f55ca80615aeb1f0e46da3793daa805885577d --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b240d45032863dbf04b4027dbd6419ab8f0b8001b5b06c6bb3b7238a4761d32 +size 208731490 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..41952176289a5c24c832539fd571eea83ff4da3d --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f44366c074ad936ef401433d395b3aa122fb80d8dddc57483f47c0224b60dde +size 208731490 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_15_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_15_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..546f4d547f9938c9e5123a48e58e11c2abb5755c --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_15_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f4f4cad01a16a09554f3588256c74e9cdc9f964fabacee706ca4a26bbe8a7f2a +size 208732194 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_15_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_15_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..faa25c2327382c6ec7a170f584b80a6a1a45a8ce --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_15_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:406ca29b818ae39565c38aead72e34dd3a71a9e1e062e5f8be04885d8cba26a8 +size 208732194 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d5e0e111e13b32fc90879920877354e53177c843 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a8e7c3f4e949a69062c9ef13e8e8ded31eac0383a47d4dc23228f065242e91b +size 208731426 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4459114241de0aada917c4a8c25072727e58ca29 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:21ef1a28d1b4c6caaec0d96f9e18e9fb17082d71a976127751f384ed05b05987 +size 208731426 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_16_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_16_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..49a905b9ea14e4cc3c6d28d01fc6b4a39d2491a9 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_16_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:53b672748f650de8a77de33e3da5f2f2bdb8b281c7b5c02626c24a898752239a +size 208732258 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_16_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_16_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..311209c57b689d5d2281c2b1f064335dfb14d7d0 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_16_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:37e3f0332957d5638d4061284be86bdd2ff56645216bc9777ba3102cf17e974e +size 208732258 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..11a3348c3419e02ecea8d5ab95081edd4825962e --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e08995ace8401ea2a088d5b7dddacdc2952e9f0727174fc798243dd544407f1d +size 208731298 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f3f3da2561d7e977e874074dc58845ac4fc5b3a4 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb8c9105cf0ae2f66ff125e182b8548095a59ba8a6491a22065dc5245e7f5ec1 +size 208731298 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_17_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_17_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9133703849aa832840751c0458f7270674aee6ad --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_17_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8fa9f44e83adf5d4639004149e185fec89027b8be228f263713c002da0d2af41 +size 208732066 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_17_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_17_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..20499bafedd338a60c1c099ca368ebd118d4cc77 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_17_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:980d4b0813955b37f000250cbf13dcf0975b7d1759cacd9f32a77d9967ee7dfd +size 208732066 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d3c5da33751802b994c4dd6d2779de44e646fa59 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf530b3d0797a8d55a78ab4ce73b269cdece42e593531d90e6b834908170922c +size 208731362 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..42132f98058724bb59640c594371e5c0b3a7315c --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:05d5dbebc7c7750c615d20c79e1044a22bdb44715857de245792930138a62acc +size 208731362 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_18_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_18_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4b8cceadd823c6b2dd86afa6a203ccf53a4b4c0b --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_18_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:88d605cef3ddda2a50a53c3fb1061cd8926d91deb2be1a71dd044fa3b1160790 +size 208732130 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_18_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_18_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..70e908a675254cbb996fd537669bdf55584bf330 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_18_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:87c997a20e511bb296aabdb90c1cbb643d075fe42ec7ac6332ea1f00c3ab5c96 +size 208732130 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b1ccb257d00889f8310369b42421992a02cdc813 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74bf4cce7b5a07e889c69d830c5e38c31447031076ddec7eba5a8be340af9b3f +size 208731362 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3b71b6983aa3e2bcecbefa2a9aac0a5c02668df9 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2366c743345ce648e89764f2a88eb2851ac15fff3d6dae8d4f05711463451fa6 +size 208731362 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_19_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_19_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d4ff9c069bac2920357c1b49ee0a675ff3b2063c --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_19_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5fb88ccdf3f3c31fc93f64a1429974cbd48feeb151691e7797e6f12b80255f4f +size 208732130 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_19_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_19_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9d74842bb14abb44dcd8d96fbfd36182115ad410 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_19_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:493d7c024c5a6a91b96510c4a0bb9b1586582902c844c38ed9ca114c6f29388a +size 208732130 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..552975055f0ed698c6605dc6bcf8fc1613232b2a --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73c7bd721c0068009a2cdd16cee29e0ceb19a57a11677e09a7d41aa3f80b5f87 +size 208731351 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9ed9d8ed0caf3ef3775007873c4d59f8365c0c79 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:32c7fd56f4a493b02b9ae864c0195883a5e98a9abf99a5c7aaf191e09b97bc25 +size 208731351 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_1_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_1_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..880e06d5f0e6410ae03307ef7cce5d551522848d --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_1_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4298547215785ccb8cf008cab4db70e5ef16fd5e99b7543281c296bd150f084c +size 208732119 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_1_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_1_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e6c13a63412620bd092a73ba7d5d5be593e45857 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_1_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:340930d6c285985b033db76e92ce5fcbdaa80e5f0b6e268a660dea9043fcf75c +size 208732119 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f2f2983a6110bca5779c5971bd0b592c89e25f92 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c96161bf3221984573982a6173ede9479c134499cb36bd9fb3f5d1bf18805bb +size 208731490 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b7bfcdd6bfac29afa9f3c2f9d8cadf89603fe1df --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3588d565fbab6114a7ea58a7cd9042dd935cadfa62cd7b669fafd7000ada85b +size 208731490 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_20_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_20_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c85bd0701a0f4d89258d01e171aa4861191e4502 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_20_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c7656333539d1049cd810bbf0ec1fc596ba2edcd34b48683641b6eb5d4882ae +size 208732322 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_20_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_20_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f7fc7b0119136794a64164851745dd3c45d972c7 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_20_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:532172762f3831bc59c742820ec17d19096666e1599b05a4f04bd8f4fc11ead8 +size 208732322 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e81aa8ae69a80790aeb01600a8fdda7b341ff4d7 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d54e6656bfe910eb517411dd83e4b3acc3e74e989866a328dab89051d324bbd +size 208731426 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fb0ef55e65ffa5da4826c5f8c4214403d47c04e0 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f8329c502e6d9c68488371f6ccaa41f0e5692708b4b2dcbb65154f87b82c3b12 +size 208731426 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_21_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_21_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..360cae993de5a277e52aa0d5d3abb652846ecbd2 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_21_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ec3f6add8624a150a4abaf08555b9ca56906aceb9824e5a3103fd96edff3ba6 +size 208732130 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_21_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_21_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2fc8c11b68c2253964574bb94f198370e6530476 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_21_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8fbf51b1ec5a02c4876b0c7a54bcf274fff9588ffe55fca3bbf363c07aea14dd +size 208732130 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7d1cd11a80bfc2b0144b3153abbdd3367d3d3779 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4412ad4e6b9b0c4fef798c5a0bc8b849965ede4d3c46c4bca6fd54659e9da105 +size 208731362 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7d20c607cd65632c7cf281f3d6935a5a951ee03d --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:840d5020b97e1c93fd62da9c3bbb7a89d82f3fe773ef75c599190e08eeec7dc8 +size 208731362 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_22_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_22_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..570ccba62b73fb60f7f2990f5980845aec2cc62f --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_22_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:25b3c6199c358b102b48e6b794bd2e5cace83115f23dad08bb68b2b6c37ed74b +size 208732130 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_22_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_22_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7e2d373508c5f0fb7b84d73d4a7b649bf14a83ff --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_22_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:29ba04a4bd79698534bb827ca20161ed96a0c24c75a0e5d34831e867406560b9 +size 208732130 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3270c035e82694c89b3859184339e6174b736afc --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:632caad7155042fef9c2c759bfbe629df3766729fed58a742848c376998b8c9b +size 208731490 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e4c453f3cc43025560f3eb23054c372e02b795b0 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:03774e607eb3ca7e4f9d71b7db31fe63d282a92f6d9066cf883c0a7acf3df958 +size 208731490 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_23_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_23_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a81619874a1e355ec04d88527db2bc8002f1e986 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_23_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:33a97445819cb45227004b37ab353f10c054b0be9b93c9ca3f2708839095a418 +size 208732258 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_23_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_23_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..91e9fc7ab9ae8683465bc3f24b1601085862c41a --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_23_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e93b729b5e978806a2f47b3b66785ac928b1b0cddfdbd76fbd9be6797cf7e5c +size 208732258 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d7e08797319658e2934a6a2fa253695948ea9168 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ab1c2f5628c0d6fdfba3e692e5281a6bca85e57be1942adc09228d41ac4346a +size 208731426 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..09cfc948e57d8234701a4033c70ef6292ed6cecf --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f572c56958319dbdeb354b795541f0482593780a610e3c57caf553ab37ba8fb +size 208731426 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_24_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_24_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cfbf81de47c7d54bf2df9986322ae3f88515ae59 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_24_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c73caf02a860df139dfc9bd2eb3166337305df958fa597a5c8e3a35653794cc +size 208732194 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_24_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_24_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..46b898d561481f361c392d80b2d58ef834f518cb --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_24_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ede02113861bd0e61265994cbfb1ce25587d151c73315017cd129441465974f5 +size 208732194 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..87ff264f0615a4c9154120ffec9f428fb171c6d1 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6396b1e191dc35854401d4dbb11dab6e07202a92b81939f85dda8ba2ede30978 +size 208731426 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c6fb5fa052c24f1b98f634920eb8888f4e64ffd8 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b3a73b335a60e308973820bf48a01fc5eeb4a57aaadcbb933876fbeb2d2838d6 +size 208731426 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_25_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_25_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1158942afddd67c5314d0e60ff7a66feccd855b2 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_25_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27444cbf02683b25c42c94024cf512bf4627a9fabc941b8ec44262b75d2f1aed +size 208732130 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_25_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_25_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..11e6c788e2ccd669f3ddfcb51296f8d7b247ecd5 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_25_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a6ff13b20d91f4fa94da667fc11208aa59fabae18ee6008f459aa6b6568302ff +size 208732130 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d6718db445c02a72be683cbcce2563106a4b9cf8 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d04596fa18cfcd5b52e4c9936471d4752c954ec369b31c22e829dde786282349 +size 208731426 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..28e13c8e0655310866f92113378868c116f6e476 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8c9a274321281d220cbb4de121763394708b4b48d62ba4ae5381385c1c3c451 +size 208731426 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_26_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_26_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..292572e518aaa0b8eb42b846abc77de44450ddb0 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_26_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7be1b621a54cdbf6c06e5427eba7f5c925fbf2bdd8efdd09a944159f7fba2a24 +size 208732258 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_26_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_26_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..92462ce6ae2bf4dd4a5878429760f14d53b1c17d --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_26_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b5cd3a7f74af6ab19d2a0add88a7d03975683a5e294fd33b1d0e7ad41bdd1c4d +size 208732258 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8fe2213929dafe21442cd827745a894f2648c771 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e32243c41b4a1ae311316512f9918b53ce0a2997c5957c9c398effb9af5e524 +size 208731490 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c21789b8fd7b4c661dcf7bcf93d1c5e73c4d5827 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ba0cdfe17d12de568a7eb77ed002a3a22366d08f4e6c2c5a11675b8ff729aca +size 208731490 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_27_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_27_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e8f5c2c3c452a7997d86d9fafbce5edf6e4e45e9 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_27_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:839a211b85ec27886c9b9fab0b3280c0168de60843fb2a7617e98954c7c93a31 +size 208732194 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_27_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_27_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cce99ca2be8194d4a70ac9c76dca1ba069125dc9 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_27_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd9d904c7bccb4bf3075478f4e1406fc46db2c7e067ab64d2b797207fa414589 +size 208732194 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d182b12de7b8e571975c151f771a7165424b7ba4 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c52c486df3a4d0be9eb5ad87652d0e01fc4ca7d3f8fe9e5b9cffece2a57904a +size 208731362 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b9fff5b4061b396994d8d05642da858feaf3f2c5 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe02612aeb686ef49eae18b9cc93a1b876e99f348cdf9bf0ac61084364819994 +size 208731362 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_28_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_28_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..96272cdd29945527f15cdc9f1a397d06ba93270f --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_28_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f8727daf05c4ea8107e7a1b8eaabc956a7ca7ae80457955426c8bf1f12717f7 +size 208732194 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_28_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_28_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b3279e4c8f70f1239ffc1a8a2e5ebe87706adb34 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_28_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad455c158378da859d83eacf16b8f98e6a826de70820294ca9845d77fa4d9b0c +size 208732194 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5c81e9549fc573b03c91d925fa833a527956f5a8 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f1ba67930044873e67caed7e879e2c7849625b62490e1cdd7a1c7634820f3d4a +size 208731298 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..aafa40e3cad6d4c579b4d7ed79b63287255a02ef --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:079f08ec68c18d084652291630eda280a07e2e7581dd5bab6cbd979e4fa5f56f +size 208731298 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_29_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_29_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dc0cd9299f2769bb3976d9c061f64fa7c99ccfb5 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_29_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ea58433a4df1b731950077a37bb0ab24e69055547448baaa2035ca66e3c4c61 +size 208732066 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_29_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_29_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3de311a949361f512330c45cb2a417601b29eeef --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_29_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e173e4e8c2b8b8fb622087db2737a142d453751cd5d5347d0b935e26388210d3 +size 208732066 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..97cb2c2faa1dd6757e6d956de687ce781bb6880a --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af861bfbf446ee53b7cec90dd3189c01c5871a32004bc1a2a9397a0d7e785354 +size 208731415 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9b9cec97a539c79a29aaae1ebb67aa75b028f4a3 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd14a661aeded7cfcb9dc178dceffdbbd412ee703d647da1325102a39a199022 +size 208731415 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_2_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_2_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..72be0b9bbad31bde352c69f553feb851a5ea46ee --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_2_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:748bd4881fb5a0cf221af2f6fd807d54c3f3343a8f87b001479800647d4eec56 +size 208732183 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_2_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_2_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1b112e13646302f69e02ef35b68ad5871f010bf8 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_2_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e97494a765be0a808a1717c2e31557daf418c49e6b5908a8a041c17cd0605cb +size 208732183 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..72e988daebff27171a9f320af31d679a0d82feaa --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:36aaeb3281e1298c82d03aca66e541bb9f5fb69c02d601c1ec44b1785f8e7db3 +size 208731298 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..99606a6deafcc79e9a762c0ad8e8926f825a590c --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e5c68684a2bc3037e2fc252a94d6f31331df13145c46d879a52edf94b1f9d47 +size 208731298 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_30_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_30_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..07c43c2b3bd65674f7d58e285153c9552db17aed --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_30_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa36d0113248889f05c13f9235490ec1f7767d1219d5962dee5bc49cfa7dd2bb +size 208732130 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_30_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_30_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1dffa6e82a3f6455757dcdd18b0a595d59cf0efe --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_30_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b0c57bc71ed98b4b0b087516789c6be1b0dd97798785abe81f37bb481b348906 +size 208732130 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ae50e1b71654761a5727825377b92c2b1e2d559d --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:925e425afb5959e6a7bf660ba94b1908a779129ae0197e030dbf504d55f08429 +size 208731426 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7fd14598ce48c91ff2383436013be4702142d8ec --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a432577b1f52f431c785e7ede57c5e13f6ea3327242a4e27aab807ded4a41f9 +size 208731426 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_31_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_31_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ed6f3552b02e91e7e75334ef116ad00e87fa4e09 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_31_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b38b6e52d701082b99f5d3931e922fd9dd95acf9aca7cce40a6b4770b5bb52c +size 208732194 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_31_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_31_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e562d809157c2b1b03f64850e1185462010fc461 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_31_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2ab1dc4de97b1cf72079cd67282766f0bed658e39ecc29bd2fa8de9d3e36414 +size 208732194 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..60f52a24ef63190e70f8e2a8ab07e61ee170d746 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0badbf1153f38fd58585c7fb8d710abd081459725376f44e9465f3865be7de64 +size 208731426 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cc4f13409ada6b2bbefa7a3adc29767d8a3fe404 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d8ea52ac505e3373d2ae16211bfd80b8bf2dba67cdf16ffa38516c64112da94 +size 208731426 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_32_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_32_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5ff1ea95c4605b01edf9b6fe493191e4af1d8368 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_32_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0bc9157516fc8888e24b022dba43b584e0077eba69c312fb55d07b73ccc9b626 +size 208732194 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_32_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_32_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..73755deb4cdfb0eb7f7907b28692fe51f1ffefc6 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_32_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c4679eb529d39bd59b0ff8fb5e31eaa73eb9f4dadd478b6f8ae5a339ccea808c +size 208732194 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cfb8e24cdc688525565d5151b4c0b7d2471b582d --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:42957f5c76db4d2d93140e5e305e14c573cd0cd7f586c7e017d82c2cb66bbced +size 208731362 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0ca9aa2813b4bcf500180f9c8536be8b92946921 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1b2188a59dc0ef2f5819aceb5911b452a8932eb789e645be581d019d8814f2c +size 208731362 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_33_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_33_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..818b010d2da55446fca10502467283fa0684a185 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_33_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:75fcfbdfd77698786e8e3daff88cb20ba87013db93af2a297b18756d62424a5c +size 208732194 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_33_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_33_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d40e4e3231b434b4cd147287a3dfbcd7928a0079 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_33_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a44d3731f5171e532fc6941944af8884b566cc0c778ce4732a13b86bcd952d5 +size 208732194 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..809cc5c236e040dd6e16d4076ec3335ce37ae4f2 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:00418b382f53a8c3c697a3c96b612e57422a7cc25adf9aaa2fed7299331dcc93 +size 208731426 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d32311530e0ae7747d25ec2f459c7acd536afa80 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ece6a9a39a19422c407e902eab21ac454e429026e1fc359c3eecc4ca2390eb6 +size 208731426 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_34_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_34_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3e57705d733decc06aa58ba0ba23ca847f0cca72 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_34_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a92272f52e71a87daecbd5edd55096414403baa6bd22d902389e12634bd13a2a +size 208732130 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_34_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_34_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..903a23a2423bff98b6f08a9edf5f4490b712bda0 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_34_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b0379c7a6ef48d396502519fa65f31ffa0e9113716533355afc4a1eadfbb2808 +size 208732130 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f4e947f2aa5466adfcaade8101cb4ba2393ea4bd --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d6d0f3f6527b2b24075d4d361ee1643d1b158a03d4b7a24f2b7d1e753ddcdf9 +size 208731490 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ae9a14bcea091231eaf6429ad241bfe5b95147e0 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b5adcba600beb7d339079143c94ba7a9ac05f10fcdf5bedc07ad405d9e87dc7e +size 208731490 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_35_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_35_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4e766a625283fd1cf8e971af96d4ac46d460f848 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_35_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7abad5f32cd88630b7bc33e627c69b0cdee5c288cd53b12d42e74e96ee023111 +size 208732258 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_35_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_35_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..338592ab74df25d935a5c65adbaedbbd898f44cd --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_35_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7cd835af6ffc2a48a466552ddc753a8181ce1957ff01dca614302f683a96fb49 +size 208732258 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..284aa3c4daadfef8b414506182a7d7be54b051de --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2cf9012e8e0c1d857e042f27fec63c753ce0662669665d8239e1bc197a743e58 +size 208731426 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a957c629d6353432180150495cadc995dbe9dc9b --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08f7711709ac151619b06ae2905ff0c8d19450da9e1bf1afe8210f1a5a32cfbc +size 208731426 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_36_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_36_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..78a38a0539f631f242e1e5906e05f634149be634 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_36_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e4f757591215b5f90a7e0346f81d595e2cdb1ff1a68530caff04c72ecff62dc +size 208732194 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_36_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_36_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6eb1ffabbeffa3575d68447d757e5c1474a7565a --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_36_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:24e9b7cda2bb3fa81db66e7ef1e87c4d32f693b4e319c178d2528f4391cc9158 +size 208732194 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8f6cdc0d22fe3b4a4f9d33450a5c07a9f2ab9938 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c5a0152cd7444c8ec9abf14580617d0c731d633c004704b0ce292d7835695d6 +size 208731490 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8362a1e6137a30f94095b1e819fa9b891355b56b --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1dab3e6875be9716d084fdbca3b5d40f05aaea317e2cb66727aa07e2719cf08a +size 208731490 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_37_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_37_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8d5df87bc91b6277b39991bd1031f3e3ad32f6ac --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_37_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:faeb7e8c0afe158320e5c4ec7410ccd1d03d41a5c415e224fc53efcd52a59e18 +size 208732194 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_37_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_37_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..39f14eaeb62fc1a9ce98329d3c736f5b893ca05a --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_37_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:48484a3e7ca0369d552eee43d72dc04cbdb12e11b2e02705e70f19e93748f52d +size 208732194 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0fbf29a8f563d092d104aecdf2be8432be739144 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ffae876fe81159d54a56f334d7e7b940dac2bed543dca8fda072b6c98f852c24 +size 208731426 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a81e691f1f49d5b371c3a2fa48babd21c5485e7a --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cadf86ec89a009a5149884b3a436e59457c012a68850fd192b187c4a90a1f941 +size 208731426 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_38_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_38_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..30fd35a6207fd176a17f4a782129b71fc303cd8f --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_38_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ddb0f8cc15fb26ac6a94833e2caf0b6225414f0271e0bff4fe3af7fb3302e1ef +size 208732194 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_38_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_38_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a674b9185783ff26877807b4e735498d365c6865 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_38_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7bd1fed037bfe2198b66f33be031e8969104d6bbd7ce5b10f17717e5b87c0f0b +size 208732194 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4e5e1c3aa02d99b4c149054c12dcb12a6001b334 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7fe7e0f4713629934f938038032e87b0372d91a7828614ad0f4f5faf76dcfbe +size 208731362 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cb953b41e047b56cd1e7cb73fd1650c04ff00863 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:00ac37c584ea236dfdbfeba7859fff5c448f2f5d5e44e2682292486cedf30ffc +size 208731362 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_39_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_39_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..83293e963065b559ca1b8e6fc919c4baed9c86e6 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_39_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3b57824ee6355f0792067c4091ec6046a0c7ae94430f0b91b64a42ae8418101 +size 208732194 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_39_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_39_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c49e26214ef1ad5255c05c529cd36efc28e0b45b --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_39_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d83b09f12b7c86dbb7e178c5007a5ad4a4046729f8c472dd2f84edd713f8eddc +size 208732194 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..428c6cb40fc06f20f81abfba66a85a520497d40d --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a0cf65e639dcccab61f03b077032182fb6911f1f3f94cd970ad58fec06d844e3 +size 208731351 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..48e697b4acb55e6af05227d97ddb978f22e1c5fa --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f8057009ff201d3b0954aa63901158971737e0ed7fb75fe3a868e9b539edaa1 +size 208731351 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_3_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_3_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2ccc57bc6a7c69d3fc6e2fd09de4ea1db9e5b03d --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_3_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ccf0a3e9a4810f049bb05d351899bfe84604eac7faa985ade919160fe1a3c14 +size 208732119 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_3_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_3_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..baf2c875d8959b10574717fa72da6a7139ab43aa --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_3_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd0f79d6ab2e5614cf3a5162b7cbf5989e974ba1371ad3ca4a8efb30eb0e5791 +size 208732119 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e2fdf412ca9a4e1d481593bffcb5216cb7633851 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23aa919fe797adec19c840e7b05150e5f60fd5c2c4a445ceaad6541eefaf5f4d +size 208731426 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0ed3f14c709f6f87b4d25a477003dfe0a68b2a33 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:269f4f3e31704be7e03aa59f0d9f28ac3a26ad5963896a927e7ea962c2b29271 +size 208731426 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_40_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_40_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5fe8c0bc51ebcf95a5daabf7c47da1b7674a5734 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_40_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b888e653a00c2ec6d3ac9720c5f528f4c4d3f2fc53f2184d4a5554e9eaffa38 +size 208732194 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_40_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_40_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a95d1f626afb23e0c39cb7979628ac0e603d4d1c --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_40_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84de38d4bdc4190ac2ed9a5bc73964be0b28aa8ea4ad5e6c225c7834b2d28699 +size 208732194 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3448385f4b9a468b7f8d8a2366ff208d2ccc0d59 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:33db240e80d5a4f44372494761a21d71e15b52768fb636d185fa0854840b89ca +size 208731298 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2d0238b16e11486cecccfa70d62dc35404beca52 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:efbe186a83bc067898eaa264cc62071cf8a0634273da1a41a394823cb80aeb85 +size 208731298 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_41_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_41_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e3b8cc50c0b2f24b8b265e689cad7c60a8afe5f4 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_41_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d69e2e9261fb9f8bf8b4606b5cefb32f3ae18cffb744e26f294b16271a2510c9 +size 208732066 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_41_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_41_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4c9cd0a5ce0811f3114944c58fd2219cca245dc0 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_41_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cab5b5acf0ca614c9c853871fd52a8e864c410b16cd164c5b01ee216dad8ff28 +size 208732066 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..873bf23f6b0060ca0c491df68b724016a7c24483 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f8dcecafa8c738a73224397d6e9960749a1a3a59b19c42d49fd79223a71fe9e +size 208731426 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b328ca60b1d2fdd278d3457890163230541aa85a --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d1ad8f65e1df98675a9c0adc6761f6ea22d7d793726cfd994630a300b1e6ab0a +size 208731426 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_42_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_42_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ed22733a7c7bdb3217a18211a4cd6b2bf55e7759 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_42_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e9f1fd7a681fb9d5b661fe88f12af58ce21e40d579b3f81c76189c9e2122100a +size 208732194 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_42_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_42_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ab6a1a41b7c137ca4a0814c973337e89954a5643 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_42_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0951715dcf38289742d1b3f08f94b1f0a4e86e2f617c8c228b3313ca210890f1 +size 208732194 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..12ed9d4ecb5c7e93f6701f543fd396129ebb9af2 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae7ab14e7ed4aa1b3bf1ea06dbead12ad7036e6e7f613231f9071de823ece5cb +size 208731362 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9136939784715be3b887dfe7fce0d86833a95d11 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e717c54c28a2a41553830e7b50d3772c32d408853d496cee5be1e3ba6bda069 +size 208731362 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_43_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_43_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9122721366ef55c6b5569424e38144c17f2acfbb --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_43_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9df5bd6a318ec515038d8fa31a714e872036cf26db64ba34a76655dd04927fad +size 208732130 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_43_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_43_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..29ed58aaf5eceb630075ab0246c9f5f2b7755ac1 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_43_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:172dc128d0a2203611230c1e203d6dce625637b4cdd9de2cfdd92b2df4f80e78 +size 208732130 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d1bd7d6411c2fd547ecc7cb3671d01c2b3525fa2 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ccda2269757580b45a02b80c2800d0d55f18c258a1e5678b88f739a7a80d2f8 +size 208731426 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..acb3d7f00011366c1b2cb2aaac023ae8c29b6b6b --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:506f72fbe9494b909fa9b4960074ccb633a2b66e1760d8ca299286b197d8fd20 +size 208731426 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_44_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_44_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0c4653f3038f30812e39cb846bc0c36420d665ec --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_44_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2bfee8d01e797c06ab9e68e10bf114864fc8ca3ae4533451ed0a14069bd31cc9 +size 208732194 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_44_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_44_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..587f97d2b4142bfbcea1af69cfdb5f1ad40a7d3b --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_44_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:12bb099b76441bd0a4e66a8cd9297cfd2c89509e748381f61dfb974aad326cd4 +size 208732194 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..14672f16bf0755f28a208f9ac933a70e11696169 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:734996934d674d1cab8c674230d131c2dcc238016834bcbf79a18380febf3e45 +size 208731362 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..43aeb9e5a3e00755a5f7040407ae41d693d7d6da --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f9f869bbdea4f036ab326a7d688e70cf93c8946e7bb4009ea2f28c6c7b1edb3a +size 208731362 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_45_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_45_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dab855713d03a9968a87e7b4166fb4626b2ccb47 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_45_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4652473dccccdfae7fbc7221e85c1812f250d56b4cbabe1f9382467a0a08ee61 +size 208732194 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_45_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_45_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..53a601b2821019051b6c0b302194f245841e91b2 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_45_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c41458a20cc1f9ed1e984814623c02737b31c1c96e9f10441295705361f9446 +size 208732194 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6ff85c628aa916fc4f2b15319ebbb18aabe74eea --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3899a67751708afe0e2804b56453e9f51ba4cc658caaacf7dbf35ea3d7e31e29 +size 208731490 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2d0db57a85c60a514ac4aa49ec3fd827b80e0dcb --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eaa97f22f42041df170af8845959596bfab794c6e7c79d48df1af7aeb136d29c +size 208731490 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_46_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_46_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dd75d4affa909d7125f574211e7ba1fbfe075415 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_46_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:93ed271683cb1358e53d9b9fb144f018a733ccdc7d3e74fd504e73004267385d +size 208732194 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_46_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_46_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c17d5e411477fb3f94bcf06b3792ee2e680227d7 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_46_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6937dd9ad20599f7bdcb7ea116895f2dc42b5bca12e5c67c403616272c368a1 +size 208732194 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a76221cd55b831997854d31449bb0e85781ab9c5 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af54af8f97707d92c260080ea0827ff3fb73e48962b69dbb8000e90f86542af3 +size 208731362 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..46174e87cacc4fd38ad8874a6ae5487b74bfc339 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3fa126aa6e3ba67305a1928d7e95eb17eaa43cd1eced9ee5ccaa48bc0144683a +size 208731362 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_47_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_47_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f485d9e15791316dd8f899a1f2175b628bcf613e --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_47_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf364d42e2fbe12a64f73e37037d41251448c7ed7d4f97b327e2e2dac05215c2 +size 208732194 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_47_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_47_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5496631741cc7a15b43bf5ba8de52f9fa0479a7a --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_47_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a4572d49fde8d567d873663750d2a1c44e85268ee07c44da2e9f8c47335c3afa +size 208732194 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6aea725a4fbe01c0f15e1436d031a83be62bb857 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b3ae167d48c032025f895a6b9022acd815276b5bb3f91b1bec3caff915f610e +size 208731426 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7dc605667123bf53fe332d945ecd0ba2ffc771ef --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c2da91919c8a65d99ca180eaf82689cba69b3cb0431847c3a98432daabd4d148 +size 208731426 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_48_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_48_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7419bae9141080c88e7a354d13b34aded9ecd92f --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_48_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e332a607372084fb6fbd7067f45744e0e2f15aa3bf8546a0b270d7d367e4ad86 +size 208732194 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_48_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_48_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5253ab62a1e835901dcc3e78c0450434af6ed596 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_48_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34502128eba8392d0566d9d9ca03c8ae6453f8aa39f7ed33e677cfb6f144479c +size 208732194 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2be87633c4ad764e1ff6f601d49a9184f9ccdeb0 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:495cb7b0e40329a4b272f153cbdaf3ab6011f9c8417458f612d1480bef2299ef +size 208731426 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..84c6a0c50fe186e94fc3d054a5e656d86e7c2a3d --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:24014a980da1aa139f9e9880c51c13d8b8d2d723ae2890394a76a2a54dd23784 +size 208731426 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_49_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_49_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d4405628ac224974877b5de5b9809d6f6174d75b --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_49_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fde485e2441d84c27f0c6ae7ea6e1ba59d30e269183028eec07f83b161faf3ec +size 208732194 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_49_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_49_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ef8b3f7fa915b4c12a23ed9886ff89ee65a145eb --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_49_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cfd03cea2eacf563b944b7eb830bcce52e4de3a9eff6ec21c085036fc42fe55d +size 208732194 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8051cce99cbbe010d7095c6c448b28ba00385f1e --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6e3dad724840a44d7a00f6616c47a8c37cd0aff324fde21c6ec90ea63312fab +size 208731415 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d2a1691104ce1b8caf84c5f836bbed38f465b434 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:37f5631b32c3119c2fb4ff121045b57bb2fa385851eeef33224c9baa117244c2 +size 208731415 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_4_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_4_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..15898db0f7bf058bb217ef15ef88c2b8e6cd1db9 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_4_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:476f1ff7dc9ed2d4160d9c54b536c0ce54d6c08d5e50c871eba96e13416b581d +size 208732183 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_4_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_4_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9ddea18568e0fee635702abf66d537e29c07edbe --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_4_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:abc343277726c344c7e9bbf672e1f9307d176326767f7970207a6e8ee179fee0 +size 208732183 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d4a6470255e8c31116fb4159168fc18a00812688 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f3c26e6af67f005262e74a2af99dd4701754c32fe959e5cac6139dcf0a4c7a2 +size 208731426 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..62d6ec416ee0b314b47ed2e5eab7b7418b0cba2c --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d1d46fedf20144e2d8e5ea788798fc1abbdf64398e21685b36c0534e1be2ec75 +size 208731426 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_50_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_50_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8cc2e87426f76755b505e3ccf2fb82601dc1a3f7 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_50_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8c7c97e367f0de688fa38586ca8b446593390db425d4adc28f3b9b2dbbafb57 +size 208732194 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_50_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_50_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d6b82df3f09ef8df921cb668adc1bfdd79c5ece7 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_50_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e3b7e01b50a3590114d8369805146009d6d0758456fec5c06e80ff99cd74a83 +size 208732194 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..51464d0bd2293a3a6201f8e0048c2ec7356f6981 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02f0ece01343b76dffe068b89357ddf4be1a8486ef4ffd7111c1685a2a12c5f3 +size 208731426 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..659a21e28dfb0d4ce2c9ae22d22536b72edeab94 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c804cec2a351112e41abb4ccf984bc205923ff6271e8ca2dba0be439c5a97af1 +size 208731426 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_51_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_51_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d0dce70c85dca24c5cadee4ca50614a17d00408b --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_51_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b0d13aa67ef62c2cb3ee017600d9b601544da3ee7b67989b2aad98a737e9b02b +size 208732194 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_51_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_51_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ed4c741672a1ee8cfb1fc120c4bc9909c7059481 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_51_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ada9a943611104c56c4e5b5c465e0b5ed5597c8c0e17110a854b5a45923ef050 +size 208732194 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..460accdd0a7535e95148452cd418912105727f0d --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ba4986cf6dff64c6bae9a9b21e1a719a972bbf8527c2f8d521eacc67bc8797a +size 208731426 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5e6be00df4f5fce9e8762243ba647d1cfd32eeea --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dcd9741b5e9af163dd1830ce42e1c61a019499d317e460bc969c4a4ef2044f04 +size 208731426 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_52_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_52_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a64d2e7771a4bf7d85f93154b53f00a1f58e4bb6 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_52_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f99f24419a2f63bdb776497659845811812eb3e32578d5818152fa91434a915 +size 208732194 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_52_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_52_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0f0e2247d7d1e7a9449180f12ba04ab5cf1aa793 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_52_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c43c9e0d01d5f25c5c3a1bf3f816f54c60f55ad286a1b30cf5902a0fa87e091d +size 208732194 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b5d69fbbfc714730b6268b65effe0facd986f5da --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9669c85afc11de5b36d3765ee7ead900d55d4030fb7ed7d6029c45d4614e5dd7 +size 208731362 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cd03632f068c812c40d820782f18b3a2254afc89 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:866ad3bc7e14e407d9674657106eb06801fec40ce15b5399d0effb670b25c944 +size 208731362 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_53_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_53_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a2ac8eb59ecbda55a690d80b96409d03b441b2c5 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_53_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:495672e702ed3ffa82d8f5a6699729e19f45abdbe9f828e4364f7bd55ce98733 +size 208732130 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_53_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_53_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..85d50256686b0cfa3fdd6498166768916fade005 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_53_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1072028e394effdae249f88208d7a81dc1a0fc0f9acb0c4969000f0923e7681a +size 208732130 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0d1e2eb6e688bb334d0d4d5a812c59b0ce8c2c65 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6a8217ad9afb62d39fc40b7f80c4169503eeb387e4f11e9356fdc8dfde4e359a +size 208731362 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7046788c8571685c733e6c6799df0c4acf97b0e7 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e110e8fbd7e2848cb216e1aec457cf7795df1e0fd64b525810958cdfa5bdd39 +size 208731362 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_54_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_54_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3581c66e529fad53091019cfc60536174ab1156e --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_54_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f1c8eda0795e0f68f60144de38bb00cf6565cd4f727f3bd3a68c196a839c8a43 +size 208732130 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_54_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_54_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..89d376f52523ef67fa8d69d5698ca016edeb8c34 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_54_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba524a1a586d2c6a9b774a800723711fdc68207078784b0aaa3e82ed31cc44b6 +size 208732130 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..679768e404eda4e28b38829c74b2546f80cc9d1e --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b3e2d7478bc9ddee3572f08e4b4c7631d3cca91d6ca248653704cb1ad9c6ca3f +size 208731298 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cb3ce02d4159e3335eb5cb13808f67d7465f8b41 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ffce34df12252093352016f13e71a4ced10dc664e1f2eaad17e80f5a331cfa0d +size 208731298 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_55_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_55_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..57257f0ce0f9bce8df176e5ec84f9c38c3e9dfe3 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_55_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af217b53b46b0d731909b0b0537547deaeb20a5a0584423389b107db80fbb2e8 +size 208732130 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_55_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_55_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4ac66a1a21792c9fa418ba3b411a24f3b7ee4a06 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_55_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a69c8df5581f175f30d669666c753e02d29e7e5346ef378dd5dfcecaec2add9a +size 208732130 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d88f7ea1cbb3cb49fad2219458eed726e3c5f9b7 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:270204c367435114ce9d339254fa7326f77be1b61ddbf4dddf37dcd8d51c80e1 +size 208731426 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7c8e06d532b76c533ff48faf98ab5729a0e2a293 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31514519e570f53a86cf8b116e986478d75487ba57aa7fe9c6b1acacd06b1dc9 +size 208731426 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_56_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_56_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..54e89df3bc8fabbef4b1474eb4c55b99b53256b6 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_56_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6bb1063f5cb508cdc875eb0a64f20576c0b334bbf9dbcaa9da280670ddbdf4f6 +size 208732194 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_56_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_56_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ecdad1f11f45d75eb84c3cbd78bc5ad4d4d7324e --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_56_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6b6e7d17eb0f4c2f48d5e47f6f7df22af1a02a36fc244d48cbe2f4e85b1c1fc +size 208732194 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a37caeea8a713073876ac688c4dea15cce564c37 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:857edab982e13629310418245c8dc5d8812f119560464343449914980a39b832 +size 208731490 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ab199aaa749ae45d98f69766e3a46d0510670146 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:596a07cc3cfba5444cef9bef8c3c1159975db63e80233fdfcbf2eb085bb55161 +size 208731490 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_57_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_57_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c8fce2cebcae94f4f89add0e1f262dada0d4e29a --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_57_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d8eb3ba25e2056b882333249531c3e28593449ff9eced900298b3b9661bc824 +size 208732258 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_57_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_57_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..428b0b87fce5251f038e836aec8503b4680ac90f --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_57_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:37f671b840c6345039676b0aece27277a7eec3f314458b32189a757549e271eb +size 208732258 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..29561ecda1b8e3e8f83fbe078362e7cf5fcf388d --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef808f8eb6533e990cba1c5a99bf9010ceb4efb9170e3ad5dd14e8ffaeb0d3f3 +size 208731362 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e8f9fb0733413c51de0aa34cfa9e499b793e016b --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ff3897a11e564841022324ad83221b53191767580f94060512960f235bde020 +size 208731362 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_58_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_58_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2f7f16cb9e4853394153fb0a39a0e2e4395c811b --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_58_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f1f2406f2ca2a3b7ab4ee517e4ceacc7978516dd14f2c6e72629a0657cfc778 +size 208732130 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_58_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_58_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8ed845e53fe763a001b4dda36ce08341c8e9c7c2 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_58_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:15406f7a3cff1c46a018f47c422696922ac212cbf4c4a7626c57c7866a2ed49e +size 208732130 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d1cfa73688f22a6c46d3ea3c1779621731fd2caf --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7abaad3434f5c2b7002b10e757c9f7faeea0e6e59bd366cb1a39a7c079e6d262 +size 208731426 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..825f1e6efeb62eaf1314c4f9fcfe7178a2d476f1 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:95d9fd94740136036a7c9a3e112bdf89163d7c2e265941da0b00283a1902b354 +size 208731426 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_59_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_59_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c698d3b6a4774c594864bcd2010d1789b14393bd --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_59_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f930bddd76a2b5e382d02f131ca7aa9f50970a3cb75b140344de746693628679 +size 208732194 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_59_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_59_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..56ccd9add38288f3324942fa19f48ffd6be7413a --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_59_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:71d9a26f74dcfd675a99a81f7d44c1708e65b41c57fd795acaa85c51d002cd44 +size 208732194 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2ab2d18ab35167069f73c9602a5c8c8b0e5c68d9 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d390a1d8a319e7f833a7c5d06ff5dcfc925e725c9dcb7d2a68a9c53b0da21be7 +size 208731351 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8b096720d8b9815892a7b0afbf6276bfb81fa4bd --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:41f47e7dc53865df999c2bfc97602a531fe3ca6af9a8ed03cb78939e1ef13d22 +size 208731351 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_5_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_5_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f7701359d6998ebd383f468c009148fbd8e9e429 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_5_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8909fb3e1b61b233e26a5bd8c7044fdb8bee7405369c385976b1693a01093b6 +size 208732119 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_5_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_5_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dfe7e7956e8f20037794db137f16fe246fa09a18 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_5_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8022365ca824a18028a4c9b5a992aa0c340e437fbf59d6d5682c48bbda1ad738 +size 208732119 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e281d3a56891139399c9084124fa7943164f23ee --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b05dabe8e69efd1b0e279d3f2eaaad7fa0e64ea48ba1607a7ab0e6952d403353 +size 208731490 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7ee27dfa8ea327d01adef402d158552a34a4e723 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:40a78f8574f1a69efc0b4c00e6bb301461939edd2180680baeced6dd65f57357 +size 208731490 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_60_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_60_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d67e0aaf17035fb4be4819f7814b5f33d169f48b --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_60_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a18bc14acf8ef9b5cca8bb35cf0020f761b894df141930f476d331abea368a6d +size 208732258 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_60_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_60_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e7db6bf0865041295529feb7b36db1488cfdee7d --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_60_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c0502e0035fb4909f37eefb901b05dcaa2ea55c3bf7ee391427d998b13a16f7 +size 208732258 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bdf7ca794ba450f84f4deb04a97b0410bd2a71f5 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5058693e726c93038479c30606bdd6861974079fc0de7adcd14ce63fe3c6f589 +size 208731362 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8f4cbb7d4a0d3c92cbefbbebe0c98ed5e13796e3 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e30c76b6df2f2e3ac309f655f18f90605e8d94fa2f89e2de2264f94df563434 +size 208731362 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_61_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_61_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..486679212ac181461c287315f59c6026f868463b --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_61_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0c5e9c7315408d63bce678df8dd67752c7c453af65d0c1ba71c3a3b69d1e29e +size 208732194 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_61_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_61_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9ab69628de1d3b912599a3e820f73bc5bd342f37 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_61_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:210512b96e5a7fa395678b879676587f34166f35789719c0487a37cb0c2e730a +size 208732194 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9c41877ad17fb8736aefbd29805479ba5f4b61a2 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8058ac426e1b2602f238b76845ed15e00a0805545b4d69ad7ac2ab0d3869ba35 +size 208731362 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d2c72876a4645f848b4f8d28b6f93d8eb609b7be --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:21bf70c5b2bb26c5bad769493d514167896e4f02e0296b5d669120ac849b97c5 +size 208731362 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_62_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_62_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5e6cfad01ec823c47937232ef1ebbfdf9a4006a7 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_62_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:89999455197be6607b59922e3e1da595a5a1b6c08bd0c3f9f37492e07d71c280 +size 208732130 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_62_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_62_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ab74f1e3b850e006a3719b721376675513ba0654 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_62_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b5b02bece00935d095a90baf5170e735e8596f88c46825677f7b42f0686d7a2 +size 208732130 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..971034e05639880367aed7cefffc7e81b4fcdd14 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ffe01e27e83cff2b02d72425aaeab6b7010aec2d41b5e5053ce072f6faf4f94 +size 208731426 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..666a12c9c95e3cd927e205a9224d020acf703237 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c83d930f41fb68eeb20f667ab5768b6e0654d8180d817802ce0cb5b29cd8f9f +size 208731426 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_63_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_63_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a9faa7d446746b72c6f8677789d5e94efcca7701 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_63_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b7087d2659ad864d44f63e139ffa846715e004e9c692cde3bf1fa0c9f2349d6a +size 208732194 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_63_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_63_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..20ae0acb05db0d793c6690cbabc93c910de0e304 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_63_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b1ae0dbae7fed683f802693a0bf90061c2fce4b39619bbf329dced1ede23b1cd +size 208732194 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3f015dac41648e777e76200f26e82fbc67aee564 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed0e6c8df5252739c7c00dfe33676a9e34b7eeda91bb048e56d2ac63d60a6e4a +size 208731426 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8ec1dab327452f6b75c4af0de1c2db62940d6c --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d9d7efeb9191b9bd7c5ccfcce0aa036014d37eb40785c500c255cc0280ca242 +size 208731426 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_64_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_64_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9846a379782740d59627a0885aff73f6e17127c0 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_64_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:348dc09eb3bdbaacf85f2cfb73d372237049e63e216ec30bcfa2e1cd9b9ba288 +size 208732194 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_64_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_64_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ef3ef803af5be84b030bc068f7c1ac307b6e25b2 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_64_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc61401e857891af3501b5102616e09e5acd7d8cc9b019f53f9fd5924220061e +size 208732194 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4b5d6e6f9e81f84c5e7c76f1c197969a88ba74e7 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f8d0695dac4681af45daf8ba862367525ff11e08b0efd6c8db6244272eb66e12 +size 208731362 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bb1e292fe373b04b25b8160cc9054596497bfe25 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a55188a5fca4b4c625c0620c1c97b6ad0757ca5de52516492d86f8772af90be4 +size 208731362 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_65_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_65_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..89d6e9731fbf36319d1f47c2de4e823ad4b0cf96 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_65_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:afe0baeeadc5ac8d3f8693da496059c574b464d5c7f5b10b148893869e43cd4f +size 208732130 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_65_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_65_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..39533390ef523e365a599f80b7f01079e4a0db12 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_65_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0af14b5f4240139359d1aad4534da0513e8b3286c7066cc6400ce429ff5feb67 +size 208732130 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1354238b1918c08d896257b31e0a2a69eb5c2bbc --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c02558dcca609bd65a39152eb3af26a6af63d622ee56ed8872c924ac5289e2e4 +size 208731298 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8dff12f5c2cfdea893b86c7c18d0ec112227d0 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d823165295de44c53a736a4c6891e4be15c94d4ecd9d203a3c8716d2350eb807 +size 208731298 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_66_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_66_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b7d88c8d347de8db8e95bd008c742d5375e5825a --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_66_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ebc07398c9405b1378c455f5eb113db0e0cbf3380accbe10b6bc5b262db5a687 +size 208732066 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_66_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_66_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..01568537f8db42378e4c6d438a82693d428bb46a --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_66_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee30c439916f176e78e8a35871384264abcc56552660e37a7b350919889ea7a2 +size 208732066 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8c2a65dcdc91c6e70211fced9a4e86025de3a717 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4deff7ba5781bee147ac6ddbf7be45af4557c3fabd316a5cf4f24fc429ab53ce +size 208731362 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1228cca78c99e5747dd2b79d90dfe2f38b5205ad --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e4509f3c954ccd3f9fe105bd4779eb081ff8e79191a082e8823eac584c22811 +size 208731362 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_67_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_67_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c656335b717f0cbbbfe64d506b8b17c30bb84e00 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_67_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7941fe3c26fcd1d93d83d647ada97cd70c25636d05c30352c0bce160b9daddf +size 208732130 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_67_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_67_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1bae8e9cf9b71c95c3de8f38d70b5fb5df0af4ed --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_67_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ebddfeea7c0abdf1e58dfb90d10aaf11d1508ae76420cd5a4f8ec288072f0980 +size 208732130 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f1550e3ebab5ac1a66a8afd9412394d2bf2a0ed2 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a84c98761d67648de69fec1447521014db9af2760fbbbe18595bef223a6dc193 +size 208731490 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..92f6723a7575fce702df956a3ad023440bd48e2f --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e29fc4ae39155686f63669f802cd71b92a908a57479e42f6535ee0a93a0130df +size 208731490 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_68_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_68_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..10a1bfa31a57d496f94f6e6ec1af0e8ede384d54 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_68_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:01f133b21ab9fd51cdc4481a4067224572d9e9a2c6f9606ce61ec67ae1b91f7f +size 208732258 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_68_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_68_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0905ebc2a4657d9366bdd49ed57abd38ee322598 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_68_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:82712f6dd40b1fbda8072932f4dbdf92b6f124c5990e204620e11dcff5ccd042 +size 208732258 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6a245a77b70d9ab0aaa82c1a1fa93557043d68db --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb3657c436056700ec9dee872ce015e01e753131c2239160f1a9c9500b43f58c +size 208731426 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4823c2e30eb34f56088c0f14dc4c8be2f120e282 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ff8fe1fc313170b1c4de3c2df1a70edbe941265670fe6c26e308aeba9f0b4be +size 208731426 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_69_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_69_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..30aec49832af79faf389b41b57c6bfac07c2d43e --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_69_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0791485ca0b9143b709b9b6f293520aca13ecc780414a409e5baafe2367d8551 +size 208732194 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_69_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_69_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f522194c8727bd7f5d4b1299cbbfa9424535e4c9 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_69_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:79c72805d3f6dd1eef9faf0542246ddd3c396ea928c42f016b3c365bc05e7df9 +size 208732194 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d35dd446b318e74a6cd1248bcbf5222480e7140a --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ad8224a5a1c7c74440922c3c68ee73ff0a5a1613194a3ea80b710e9e18bd16a +size 208731351 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9d1189ec6f3d7eb9e2a753a253cc12ad471d3e67 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:637466ea05b2cdd18fa743c1e4f8d6cd77c670ab2da63bb43fb01c946a937bdc +size 208731351 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_6_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_6_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c15a977e9728ae2ce1d8a4d6ccf375573d05ca84 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_6_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64c3ae1cd4f0bdfd43c50d7d6e6410832db8fd6be8ca29bd6f1a5f7082f0c14b +size 208732119 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_6_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_6_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f8541578b79416bdc151c55cb55470efbe26b831 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_6_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:884ff231021766b22c926401252cd5dc6ec68dc7957781b395776624862d8d6f +size 208732119 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6869cc69eefa7fa6506c9759d33c9c7dea2b25d9 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:48148d50fa1563de8e1c94be97e5a2a4ab8ee61d83e6447d782946f8231e33e9 +size 208731362 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..092d44bac7ab79e14b6a4efcf62e44665b6d3a4f --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c32d6ecb1bd8fe3267df4f7c1c4a4d94584bf4aaae691eb98ffc349636fe2b50 +size 208731362 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_70_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_70_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..51c0e5d65e0ac448e76febd5a778a34e94f86d16 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_70_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0192b687ca0aa9cda2501d993a5e19b5ad6f82f8a7a92019be7d15b1b7d28d4c +size 208732130 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_70_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_70_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4ad873253618ac96039d2bca3f27675ca11ae639 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_70_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:40566ba2bd7698e7ad5272990e9de1075484406b7129184961e72ee5e42225ad +size 208732130 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..16d982aad38a860054fda6df1701d022670e25b2 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa5b1c86e2acfd28eba82de495a977ee9de22420a93de3bfbd067fffeeaf6255 +size 208731490 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9c92ab672cbc972fd3387af8ac26cae3e0bdd31a --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f8403cccd5ead964c57c0da3f44ceaa7019466655ee461dc71aa4dffe0a14544 +size 208731490 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_71_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_71_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9fd9c80fdc21f7dd8345cb8101ce14e27b97662c --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_71_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d786b40343d946c2908437ad59b2980eafe1e2bc711f859cb14a7f3d3b9ff825 +size 208732258 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_71_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_71_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..39b275923eb1ba04528c4b1781e66f824738341f --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_71_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:740dce527ada34fea3c8d3d818d4221b62b7f73e47b923bdba624c34ebc57388 +size 208732258 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c5ad7dfb8902dc4bd47afa0a309ba9332ae69452 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:15b35b194cb8d719bc8d5013a675b42f9e8d4ec5af13b96f30dbb5a2ec295ca1 +size 208731426 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..19882b5895989a7f140dc9fdaa1188f867ad5fc1 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a55dcd15da82ec6d88ee7a2537ef80840852d75cc72770226bbf624aff95e280 +size 208731426 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_72_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_72_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e8a179496ac986ac85930353c4d6152acb2e2033 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_72_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a0fa72720d39e575e6f09a98c5cc78c156790e7ac463996de18dcc96657d513 +size 208732194 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_72_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_72_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6cb262d577424ece9fe23de711088df7ad4ef610 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_72_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:675b0d59e3cecdb73f8c3c414772d3325d12770edab064a51c7cdcfc41aa4244 +size 208732194 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7ce48ad528cc2411755ac1b25d333b735a8a911a --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c0699a1f1585bb6e4dbd87b581aeeec4b398b4925926d2cabf085b216e41a03 +size 208731362 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a3d665746daf11e6f6cfc4f20ee93e4042ed6ec2 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd7a8624cf61f769518b3b80fb53d9951096bcfcd7b133bedfc62e5712af49db +size 208731362 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_73_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_73_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cd78ac0d05195fa29896bd97a14186a46429bcce --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_73_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:41b366b6bca2085997b639e1d04d03d2f9b5ad1d22705c13c75e309e0d2b7025 +size 208732130 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_73_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_73_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4915f1deefecd2d63dbe7f74d7e1612d27c0ebcd --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_73_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c8998a46855eeb2d12552b635a10201f63d75a2d32936295f1ec1cdb687238b +size 208732130 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2a11e05077cf5bc65ebc7324c284bf5b5de1b7e0 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b60c5717a90d17021d4892b3c78fae08f2b6725ce34ef19668f8560e8fc2803 +size 208731362 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..43a9045c3af8177750d9a11c059957cfb7bb0437 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:020b3508c7496d81722243fbbbee930bf1028f85ccef89a6ac33c9afab887fa1 +size 208731362 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_74_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_74_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..513892a47977f822ae226b01ccdf31565e653d7f --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_74_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:09afcda3a61adc6f24973944353ef0d144d18b1b9717e694231d149cc8258c03 +size 208732130 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_74_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_74_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e85a7f6635f2bfa3c81184734bfc08d9927f661c --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_74_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4badc05e79618ffcc1596319955b1238b23f050b337e4c76f0e40df25438514c +size 208732130 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d6df7f7c0da58ad23bb5fc516711f2091cc34c1b --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:570cbb483db1c4ab82aca08ba007ff140053404a698357ebdaf050d63e80d2e0 +size 208731362 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6df3e1039b5f984418f0c8a7a637570377d47012 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c182ca57b196410301e168712736cfd1c8b1492e5736473a815a944468a6691b +size 208731362 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_75_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_75_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8dabae95fb81800a6c2ea4406d72a8c16b4724c8 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_75_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:36b6f09b0bc2abe689dd655e258679c384e7e1326c4d8d72925f9d920b26b374 +size 208732194 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_75_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_75_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3a47943ef5843fdc8620dde3f209d99fa991b4a3 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_75_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0234734d5359a5d29844c43eb676520bd020bdbb94abd2646f16260b5bc21486 +size 208732194 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f8d9c0e0bf2a9b58d659b2a554acc9c1da7948c0 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:54c11ba2e2c2e053eab12b8c13e861f1ffb3ea74bf1aea3e42af402c2c2622a9 +size 208731490 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e7332371edbee964ab753d9bbfe0c0731c5105ba --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bcac55b2ebe90355f0504d73fa542f51ef843255d85817b068820edd53305216 +size 208731490 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_76_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_76_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a661158edaef4bd54276b9a96448296f0a3d607c --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_76_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f0b217b73c202b5a536e298eaec49fffe2f6656f7444fe30037a6198406607c6 +size 208732194 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_76_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_76_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..96da1142b5f2d2dcd9f209f6b100f1f4bd010c9f --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_76_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:40f3c1de67b3cf2b2fcfd8079482c367b1595dead6f87c90879e697be5caedc8 +size 208732194 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..18fddb8c682ed035fa1793cb99f2db45bf0c005a --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:573c2f040276e698fc8d867362a6ebd46ed36a41a1795529d6ab9472aa5d1741 +size 208731362 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..614dbaf49cf112b79420d98b6b49f626c78b5f03 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:91cc28d6079a5103a8e84bb42e4565e651e4d2ba53874ec9942ba56d0ed2f78c +size 208731362 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_77_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_77_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3428d32c21458999da99249fb1aa46093fb02081 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_77_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e366feaf040b473f167aa24de5b4185e31350ce3bf3ca4cd8000a4f81e1f7a28 +size 208732066 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_77_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_77_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..06c251a91603d58f6b0d30d4ad8df37ae25fe78d --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_77_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73f7894dafcf84e852282ea3c8badab3a680e76229ba0c30c66472865e3a4374 +size 208732066 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..480b6cdb81f9a52c02bc76388f1c3a4cb701d6cc --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d1354a80d0dd2b2923a21039ce054b59d4b04e1abe21a80f88a53436f743c713 +size 208731298 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..be11ba385863acbd4b927e1b6786c4cc21e80293 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ce0b97053e355c570d9723386a85e1f23ad6895acf5a8b0e2c404bacc1c9756 +size 208731298 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_78_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_78_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..32e2a5b479f5aa0f2ed393f4f06611a8a3afbc1f --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_78_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa1e2dfe89df59343f74e9240de2604cf9b044f362ae0b5961fa84accda8822e +size 208732066 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_78_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_78_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4e916003eb34953f9125731a73bb6c57eb3bf354 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_78_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f370774ca853968d1219e6757a349929e7a9f51d908a499f460b3b84049c165 +size 208732066 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a95fe7f11f96ac5f9b7f50a959dfe910b5de524e --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6fa5d5d85274762adeb4029fcf1c84f0ed068fe8b3ed2f5ca936437cfb87e006 +size 208731362 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e5c2723e99058c70ad7795845f07c2291f8aa374 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3dfa816399a44dba6aa38e00f601e68c921f0606e9b07580569f9818b4fb62e6 +size 208731362 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_79_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_79_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2574b378ba423bba51ae3222f74e259ccc999a67 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_79_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f5cef1af4464b77470c16d29e04d1d7a0f2078414d7ae6bc6e27cbac75331f85 +size 208732130 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_79_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_79_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5ebec21d684814995f59a0538b871609a8ac63e3 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_79_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:833758bebd39e1c2074215525eb9ec03855f8fb1a23c9a368612aa26d3c6e2ae +size 208732130 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fb1d033fa95b9cf011320cc88eef618e65d43da2 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:845f53975d83eba68d7f7063786eb15878bfa1272782e719f76031140e3961a0 +size 208731351 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7b48b06f11e70a5ef61ec47944113e82926a0e6a --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b123a94e83785ddddb0f3893b10f768e7f432f3b3b7cbd96a8b992cf21e7b83 +size 208731351 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_7_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_7_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2c9b3c96d9aa092f709222a204143d3e726e27ee --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_7_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe6500dc43cb7f065437ac4dbdb68bc2801b31902836a2a20af5adec553a16f4 +size 208732119 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_7_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_7_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ce331ed88c5d1f56fd125ca4d786f45c5f13aad9 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_7_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ada41f90fa1830573ab9a963d3386f33bb045d677675d392a233ce96fc727d3d +size 208732119 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d5c14ee3342008114edc986d0187053ceae94024 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f0eb013dc8f30f294087ad705b6d0039ae9e559b2bbb3cc6e730e0ea9f12731d +size 208731490 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dd8f7f6fbe409f9a69ad365dfcc7ff184ddd81fa --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a4951227817e51ebfb829381625144c02b7750379b25334f7fa549f31a10358 +size 208731490 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_80_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_80_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9a88085879cdea8ddff0e7d7297d61d2fff08975 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_80_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e4471e94ef716246177bac31d3dcde94360b5a22e4372f410d98e87eb81cfeee +size 208732258 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_80_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_80_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..42e11e0f16193f0f23a6a558d25b0eeaff390cdf --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_80_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:332924ad5bde08f2629cf31e5e3177857b2725db2dfe295e88df6def27736658 +size 208732258 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..62cacce0b108dd243d32a7eb56f379f21cf644e4 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf29779fb41a7a155518c9b4f724d3e90cf8284e6f187696218297a06f49ff71 +size 208731362 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a3980b9e81a064c4e85fa5f3c526dd7f632ff071 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e51b81aa0b82a6b01d8f6eaa5f317cfb5334a27b856f5d372c08062a1aba4f8b +size 208731362 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_81_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_81_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e9fc2d6a06ac38078e2f0b2388ed9040f5e4f936 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_81_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a2af9616133b325ca7a37ad40204bd3c4b33077c4ac46568e764d23d5e5ffb8 +size 208732194 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_81_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_81_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9aa7f4dda5fa107f94644cad41bb38691d65ffce --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_81_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:96643ec7c41e9afa59bbf419dd8a91cab3af699e24cf8e91c1446904b0203174 +size 208732194 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..472c238e407fc0cc7d1652b4d3d9ab1c92fd5343 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d9cb869f96e644b707ba9c012c48ba6ad7dc530b0a786a6cd8ebf21a8155cea +size 208731490 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a8b4b45fdde725377a77906facdfdcab9ba9c955 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:86808a88b53f2b6b789206eb20d3c2ae557f8f9d19078f3a224fddc5b3294eb6 +size 208731490 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_82_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_82_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0891a9c9ec854ba8f38277689a2b439b01450723 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_82_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b218b8a64742308f4d3ce7678e3612a788ccf74b4ccd74e3d9f34cd7a872620e +size 208732194 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_82_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_82_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fec715af0c070d28f0875ec286ad92433ae6102f --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_82_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab11dc9e65a606aeb6b1ec4c2ed95ac05c1801e3af41a00d015f6346b738d3aa +size 208732194 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a072ca8fe8996fee5873ff4153cdca84cab12bb9 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:849f47ee64aa24d1a2f22acb1d3220b892998bbbda846e7f20df702789ebbc02 +size 208731490 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c52959e11da34c27f849564925d1beac75ccefcf --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6b320b01a60730b722b45cdb60006222689a450454b90c1e272f99cd26ef7ba +size 208731490 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_83_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_83_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b1addb64c854939b778172ff631efc4146ee0fb5 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_83_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8c4dc36aa79d74b3572155c54bc6d012cbd65160b34ed29ff918c5af1d1149a +size 208732258 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_83_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_83_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c3b2a3b65c1b3924435cfecac5395c54b6be816f --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_83_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc947a83e72b33dfa36c1b0cfc2770205f39f097040d6c06021abd2d33edf8e0 +size 208732258 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0d5715987c019abfd78171b3a4d6aff703c6058c --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d8868e17c901afd452f9001dd22b26ebfeed893c9143225e0c99b844826eed2 +size 208731362 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..603e9e4b092c8f24084813a9156837d6a58b81a4 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a72943f9936042b6837932cb9585bcfca8aa3a81d1001e1d0f662de58b01c234 +size 208731362 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_84_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_84_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..23d6d830c6cdeb03d9157b4801688f95ebebbea9 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_84_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:978acfefe11764dfb2af7a8986835bae7a49a541c7a608533c427334a35851a4 +size 208732130 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_84_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_84_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7300014235c658609dac3c2b30f85a5f15350c21 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_84_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:872e35eab705dcf024ca8c4af21fe9e00c077f7d3ffc85d152f272da5ce84817 +size 208732130 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..65f468b3b71617757d13970eee528094e74e235b --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:adba824b7652c1d0520b0fb7dfd11e4f943643fa0fba0abead68de8e7f0093d4 +size 208731362 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..01c468357ff3c92b29c147ba15cd67ac69870ff6 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc16fdce1ca086121944912fc685958e064b3070ba2363425c56a13c0416967e +size 208731362 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_85_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_85_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0bf7840e381eb56d791ef1cdaa62056ce8884341 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_85_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b76b5b602069a8e15baf1dea2b6a614db9846fe022f349ca372682c9de54e4c +size 208732130 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_85_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_85_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..55d6ba60a228512e696f5078ac9349860e065e30 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_85_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:42330617058585791b901bd7f3eaaef2e71ee1420c89098cb44bb081a0d3dc2d +size 208732130 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f902dfc609d8e699a69dd2018cb55aac799da0e1 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a85647e685ff44355da081209b9d4300cffa455f062900a7801c803be2ef6a7 +size 208731362 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..da839f5a9163f8924d9a7e7e6ff3273c35ce400d --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:25c9daaaa83f386443f7d505d9289d3373cd2fcb848b81a6298777bda21fa68c +size 208731362 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_86_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_86_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..44b63162a40b14b8434bb15c1230f8fa2c225125 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_86_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de2666415c3b72e9ce7e3a4ff1b43821b3c7fbb29157f910d38b98945d7fa0e0 +size 208732130 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_86_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_86_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9187331944940ab63b5dc9539cd7a8bda1e22fdd --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_86_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ddc933a82966670e3a2d5cd9689509e572555a8a774d7b2d0229f741d0eb06be +size 208732130 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4ac726ff79c90597db3c93de4d341aa012693037 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:755fdba4392f156ed859210a74a856ee50acb13372cbf33e85fede7295dbb840 +size 208731426 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b6ff9770993da9e9575d1c6b0cb3468efe3a904e --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:182709fece5c2c6bad37d50e5fd49aad624e9d29bd27feb691b8dc5ef009412e +size 208731426 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_87_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_87_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..abbf7ac0fc5ef74db2c39c84fe5d31d290017a85 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_87_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec608b66c9509d302278311ef53b0b72cde46acc9e7a82e3394f5440ffe0cf11 +size 208732258 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_87_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_87_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d188f0b5b99eee8aad6db7df4583343d7c9ccaee --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_87_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0154a01e017840f5caa5237d6e3269ac1524a8b785e66adf7debe9b0a3a29203 +size 208732258 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..010298fd5a129fee26c4c50b531cd1433879f3a8 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:81c62d55e4f7a0bebd0f9a082941d18d961a25c6b6d71de61a3b92a10d5cdcce +size 208731490 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..250759e0ffdff19dd945001d8feeaaea65a1e583 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5719f6104248737030d80a3400bbadd0fb20e96826d7ffe57eca27e2982978d7 +size 208731490 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_88_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_88_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..db07c471886d63c31ff80abe057bfc25c82978d7 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_88_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b3c8750175470258fd1681ca859ee1bbce20f59ee02e0c1267d7416d35616ac +size 208732194 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_88_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_88_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1801f4bf22ff5e6391b4f4481dadbd76e6544211 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_88_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:510bb01b99cffc7702da8627357d512427a839882ff8055e68f048b88ca471d3 +size 208732194 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bfe05f55c5a3fac90e20dca8b9d8d5ad5293d1e6 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a0ccf2df9e7eed544a37de20c1cd160c00d41d0bbf2bd709258b6c0aa565ec29 +size 208731362 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f74ced492cc6253708b4889072e3842126dbeb2e --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4bfcab1f098100afac97df5fb74a9270973bc9055180d8675d76c263b3e2ef57 +size 208731362 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_89_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_89_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dc30f19a754117bb2c0cf558e8b9c230e5ae0593 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_89_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da073d707a6966afc53b9dc82089ef50eea34797b3c686dd21cdb45f80fa4cec +size 208732066 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_89_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_89_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4b277142d00983ce0f9ef098929cbb4053421a92 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_89_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:456cac8efb03d9e0046c9c3d264139c68d9f018e31ab09075f1ea5830253138d +size 208732066 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e44774c895b764e1993fb097d718356c2cd0d86a --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:60c992221a12b927d208406dc02c7c62ca8717cc034c6875f7e0dd62361c705e +size 208731479 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d84b466f2f4f4f0bf7962686196a01cd2c2eb004 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f233366a70253844746a9e4876eec6a850dad71cbad8933dbe5a153f3bb4cea7 +size 208731479 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_8_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_8_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3e27eda4c7cb90dad636a2563c400191c651b5bb --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_8_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d292d72968ee6aff02006332c35caf740f265dab53a6b44e8fb9c4c0c840c0d6 +size 208732247 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_8_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_8_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bb43c5cd6c9702c5ffb4673949bd7b6372bd80f5 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_8_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f9af54c7b55555d20ab7d295be971d2bd04b005a1c7f134929e31ca0816fd27 +size 208732247 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e491170a77481a7ea79fffb1b96516b958bd0a78 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7329aa27af758ff1323d50d4993a96d797b90062a746811cdc91259a7950da46 +size 208731298 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dbe5c993c5fd6bc894b54de370aa8b299e291f29 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca4ed369199efdea518a85c50d13148021d27896c60b39f39294a7edb3df59a7 +size 208731298 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_90_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_90_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fce9999f42c8d71184622e784ae4f66d2b2e408b --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_90_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6acbd93976c157b9abe918ec80b2bcbead7828de2ec221afea3255f973adf2c0 +size 208732066 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_90_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_90_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1e4ed72cd1d4dffc0ee621b33cb72c4f63f31f2b --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_90_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca5fb6bd45a7373ccc5c4ba234cf76df5d49b08f8ea45fd24e4e8bf024c39367 +size 208732066 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..45f48f41887447ac05851ccb314ae2d318c6deb3 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c76026686c1ccdaed3d4a116af24a84dbd824a052af1883a1b96234d1ce50b50 +size 208731426 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fd9e4310bd51adccd5ba0e62353734895808e6d6 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6540a9367c71112eb91a644e3ef9b0ae419433bbadbe2b8f892e2993b32d0f13 +size 208731426 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_91_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_91_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..db3898ac9a1c756e3cf3872433b25c03f63d7340 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_91_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cbf61fb1cd80d05e65620f330c41476d53cbe5d9e2cd023cd0f5c36945bfe652 +size 208732258 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_91_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_91_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..042c36275ccd50649ed811428af9a4cc840522c6 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_91_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac0466196d6b3205c9fe2b866baa2acc64b1724752996fbff03de06dc3f4b070 +size 208732258 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3816d00fa6ebe96702212893ee6fbb35c9fec7fe --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b7ce0fd8fbd09a8a4c5d07fde8ea93ef211873144514ace14acea0a38d09bf4a +size 208731490 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a73c0d7b2078aad66f96c6eb5c8369251016af1f --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d8db358362cef3714642c49d1530f9a1754048475a92b3886d198c3a13b15812 +size 208731490 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_92_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_92_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bc47020f13a752e487c91e514eac65b4b5c4ab75 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_92_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:47b16877c96b7bbd64ff9fcfb77cf5864bb82cb6064d5eeaf5188adf6846b20b +size 208732194 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_92_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_92_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..772b64098f044399e97019ec00bfc11412666a69 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_92_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3758ee94923d1bf1de791e441fc82378a7d576feec295a2f83815c2d7bbcdcda +size 208732194 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b76cade84a9d7bce124721dbf54ae828fc7fb305 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7173f231fd5c37b1a1221b5071dc322fc68cb5d50570b7a44ee588673d215af9 +size 208731362 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e6e31f1ab91d2ab1cf2669d28a1864208a4d126e --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac60aff6c98a44681a445f4af96be80beaddb6658432e9d48f6015f1be59d2a6 +size 208731362 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_93_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_93_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e6bf35324e33ba700b991380b23b546c51dcacfb --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_93_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ffdd86f05d54415d21d252d89b728a02832403939a7048dbe97721b07c5231b0 +size 208732130 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_93_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_93_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..006b0f3b32b7270311a6df95ad53123a7f71d412 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_93_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ecf73d5a7d327c77f77efb7bcd8fa3e0ac7ba8267e409c733c562ca53ae2f80 +size 208732130 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..80c61dd91f5d3c23ac642c592d9a96e8cacec07a --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e141a27c311e4a70bda4434598deeb9318525be106ccb3070a523601bb749002 +size 208731490 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..509dd89b7d455599d14672147bd973658d53cf96 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b15bfcc98d10f2d5967a1dcb36df6292aeb581b92e60f2a0029014c8b23e9a8e +size 208731490 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_94_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_94_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a2d480ba4814f1b3aed40b0019936f764dba187a --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_94_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f8579edbfcd7e03ea693d362687d76d6a477c16ce90fbae68d734046afbf991e +size 208732258 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_94_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_94_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..82a9081d3daf2c6e1b0d9bba8493c4c8cc1efd98 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_94_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1412a9e7688fa1e17eb658897b06396c4f6481d9e5c7e66acd98a5f770734dd1 +size 208732258 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..15a53f60dcb0d4b67c55fbdae3c27324a3ae365e --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cbb8f66d57b9ac19d081714becd77e6f2027cc58a27a22caf437b0efeca57116 +size 208731490 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f75da8bb2d7a4da022dbda5ff418a45563da640e --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d679b9bccb06ccee02fe5864bf6dd68413834a35dd4d63143774da53476d031e +size 208731490 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_95_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_95_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..badd9a0feb652954eb9e304712ae552eb7f8c23e --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_95_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d037f42682aa1820f8fec044334606c38281566862ab67acc4a4592103aa8f37 +size 208732258 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_95_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_95_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..61413a08701f27a7a7a5f69d2909201a85e62984 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_95_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd619a8ae4e547886ab3ec0b59dcbfce19667981e197e6a3e81e100910d41fda +size 208732258 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bacf0cc00711ed182c5f38d06575c855f240d807 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f98bae033b5ae51524de9c0aa71e13cead09ab2ecbac8bca0326a7c87606e029 +size 208731362 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a55e6cc3343b7ac19f97c930f7cfc62690c8bdfc --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:240b5c05b4406da6ff98abe6101a9fae9e8a39f8887789954927acbd93e3d864 +size 208731362 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_96_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_96_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..842d745a4076655eded0deb2cdea13ab1c7b6762 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_96_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:80002af1616d9f57b5dc0f60173e66d088cb81d9221ff6ed339b68fce1e8c613 +size 208732130 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_96_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_96_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d414edfb499847c7f0b885094df9063db52cbe8f --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_96_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20c7132922d04f0b7f9b085d675e2bf0e598c881e2986ae334797935eb1f3ab5 +size 208732130 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2268d4a6a6952457f0e628ef489847d8737ea72d --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46fcab0702be854320e1c9e75e5a5587e60d2d0ebf14477c7056b7657f539a48 +size 208731298 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d33990a0c15e9e0b2b9631cc0316730562acd31f --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2eb6c1cdf9c6f70d4ab2e1a560f41ab5618c2989d46e7dae6863148995ee2f33 +size 208731298 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_97_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_97_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c1811d3218aa84be18db58d1abd2ed8fadb400b4 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_97_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b780fb503dda0d84b5b162564bb01b71fda129296be6eea224744e73a7193bae +size 208732130 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_97_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_97_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cc74968db3c704620636b63216235e488bc28d3b --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_97_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a6a44ab3636f123ed50e55e77b9371057e54b3415385cc5f7c75179f138a8875 +size 208732130 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8c61faa34e2f66e1952b1f16ec2bba0fc6ea140a --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:392f004aaee4545c29d1afaefd92a7ba9d9391f29ff8b3c97e04d37f2f271804 +size 208731426 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2539a0355ac60486cc1f2a65ec61a2c382e17047 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:72e61157ac364711bb8abea8d9357f6c9a9d59a2eed77575606c24dfd46c0e12 +size 208731426 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_98_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_98_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..eb411d42c6898473afa95dbcc18daac6769041ab --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_98_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0035166fc524d1dcd519b2a0072252dc17e4d5195734b4af8f6faa8bbafd78c9 +size 208732194 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_98_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_98_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f664321070f0ef08e9c7ca1f49dff29c0e135607 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_98_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3da6bec07cb82221eb40c098090a8933d32ddb2cc7c68ba31f036bb24e954fae +size 208732194 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9dd444787f123cded5ecc62ec19bea7f82d3a692 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5686ae9b75f802f2269e65660e95d3a59a23b6fc759c202e430801217c4f930c +size 208731362 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a616efe08324ecff686cd272c101b6c047c3e860 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a694671513387ca663ca863f9c08b7577553ed74c3ac71ded16733b473df69f +size 208731362 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_99_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_99_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ba2f0f8745c569a1a179e57b4413a6b2923fbede --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_99_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:080bb723e0227a858a3025b338d780084f7a7231255eb9fbe58d0936fdaf9e78 +size 208732130 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_99_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_99_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0ba01f466b8e59a49b46c8250c684568d51ff376 --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_99_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:69f6bedb28c12c65194451e87698ab34d13bd0bc38508dbe5f6ffeab240466b4 +size 208732130 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1745292a6ebd5ee6af2329709ff132dd4b8c017d --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b45e186903792189ac580c97d5ab44fb14e961d7acc1f9b19c789b7f30a3040 +size 208731351 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ac96d7c77265015fc67b304613946866d75c19df --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6df837146bc5cf9208be548c4b51eb3f806a9e00f539c99752d50031c7d7995d +size 208731351 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_9_mp_rank_02_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_9_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9084edecab0e3f7e9af1d8bd37a919b7ad05f06a --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_9_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf276c5277ed8e2e7d0088f3333f083992145e919b3caabf48d0e240093f78c6 +size 208732119 diff --git a/8b7178b88b/global_step84877/bf16_zero_pp_rank_9_mp_rank_03_optim_states.pt b/8b7178b88b/global_step84877/bf16_zero_pp_rank_9_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d6b9e6a4d06680a59fb4371636b253442a42d8ab --- /dev/null +++ b/8b7178b88b/global_step84877/bf16_zero_pp_rank_9_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c344371ffece0ec8ef3e35e22114bb8cf177e549c20fa49a94e656241a0efb00 +size 208732119 diff --git a/8b7178b88b/global_step84877/layer_01-model_00-model_states.pt b/8b7178b88b/global_step84877/layer_01-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b3ce3667b75e8328f5925b0d5b23588f3d2a73d0 --- /dev/null +++ b/8b7178b88b/global_step84877/layer_01-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e823be951187bcef96525113f57720f8c00fce42580b80b9dc4225ef5d7bff9 +size 223347971 diff --git a/8b7178b88b/global_step84877/layer_01-model_01-model_states.pt b/8b7178b88b/global_step84877/layer_01-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..79f993f80dda57d754108285f4ee256ea8c80d40 --- /dev/null +++ b/8b7178b88b/global_step84877/layer_01-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:54fb1c60718019d20fc547fa24bbc9d36776967309bcb1687c2959356cf060a7 +size 223347971 diff --git a/8b7178b88b/global_step84877/layer_03-model_00-model_states.pt b/8b7178b88b/global_step84877/layer_03-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c273c5f55ca25119fe07ae015638ee626bc50613 --- /dev/null +++ b/8b7178b88b/global_step84877/layer_03-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa013669b84ade79783d198b03bf61efea8e3089a246e5484ea584965778ad56 +size 201408771 diff --git a/8b7178b88b/global_step84877/layer_03-model_01-model_states.pt b/8b7178b88b/global_step84877/layer_03-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8158e67bc64f4b44321c5aa7af8e9c40be4bd5 --- /dev/null +++ b/8b7178b88b/global_step84877/layer_03-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f479a86ccc6849b056dba451a0a71dc0f185aaef873ef4bc3122e039f7b917b4 +size 201408771 diff --git a/8b7178b88b/global_step84877/layer_04-model_00-model_states.pt b/8b7178b88b/global_step84877/layer_04-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bcf7400153392bc1d063803400405fbe4e2d8880 --- /dev/null +++ b/8b7178b88b/global_step84877/layer_04-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02e7618e74a510a62a8a7bab735c990afb55d515a8ed3f50119ee90e850537d4 +size 201408771 diff --git a/8b7178b88b/global_step84877/layer_04-model_01-model_states.pt b/8b7178b88b/global_step84877/layer_04-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..18c1597f0baece304846d3168f5e91e5f72f24dd --- /dev/null +++ b/8b7178b88b/global_step84877/layer_04-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a4e4bee77efd9120e16a520c6e3c1fa95cf98a360e77d1c90c104ab04f6a7325 +size 201408771 diff --git a/8b7178b88b/global_step84877/layer_05-model_00-model_states.pt b/8b7178b88b/global_step84877/layer_05-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..587e64fcb8838b9000c58317938ab14b9c187243 --- /dev/null +++ b/8b7178b88b/global_step84877/layer_05-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7d23838ebdc5d62fb54d93585c06b153c6a3bcd7a2bc4b29afe131ed766db2a +size 201408771 diff --git a/8b7178b88b/global_step84877/layer_05-model_01-model_states.pt b/8b7178b88b/global_step84877/layer_05-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3991fc39992e7804585cdd6ed3d4ba3d43b1b1c6 --- /dev/null +++ b/8b7178b88b/global_step84877/layer_05-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51e3682237a220dc1d0ae5564c5f615bef277f35427faa6ecf7f9136687f4702 +size 201408771 diff --git a/8b7178b88b/global_step84877/layer_06-model_00-model_states.pt b/8b7178b88b/global_step84877/layer_06-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0cb588f2bf8144eec74e5b0a4504822538c533c8 --- /dev/null +++ b/8b7178b88b/global_step84877/layer_06-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d62d60477c71a3451cc67c84c17f4e0399bb16282797cc5d25ef0fd9b63f918f +size 201408771 diff --git a/8b7178b88b/global_step84877/layer_06-model_01-model_states.pt b/8b7178b88b/global_step84877/layer_06-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fba99b8eb71d6cf2ebe88422ee9ed5cc653a8fab --- /dev/null +++ b/8b7178b88b/global_step84877/layer_06-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e9ef8de28d151a481816163714122ddd45b1117308e99016d670e4dcacfafcc +size 201408771 diff --git a/8b7178b88b/global_step84877/layer_07-model_00-model_states.pt b/8b7178b88b/global_step84877/layer_07-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..eac70c00f7d2c5b70119c64336d312d4688eb193 --- /dev/null +++ b/8b7178b88b/global_step84877/layer_07-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e52d43e77ff21b2f3ef20eeb390479ed8e8c81563b63bc11fb4be3268ccac66 +size 201408771 diff --git a/8b7178b88b/global_step84877/layer_07-model_01-model_states.pt b/8b7178b88b/global_step84877/layer_07-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c73cd3b3e93067feb151bec2f3e15bf39d8a36c8 --- /dev/null +++ b/8b7178b88b/global_step84877/layer_07-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10d848a1b4080c73401d8980d99a2bb8d83ea3c03849f3f423d3074a61d39ce6 +size 201408771 diff --git a/8b7178b88b/global_step84877/layer_08-model_00-model_states.pt b/8b7178b88b/global_step84877/layer_08-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..011e600caa1523f3ee040a914cca32d8d5949a35 --- /dev/null +++ b/8b7178b88b/global_step84877/layer_08-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c30f89a776aa59b4c78ebaea6584c58492c8e46c2b63d05889783f1fd89da73 +size 201408771 diff --git a/8b7178b88b/global_step84877/layer_08-model_01-model_states.pt b/8b7178b88b/global_step84877/layer_08-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b8fca8d516499904af502c1310899f7e080eb841 --- /dev/null +++ b/8b7178b88b/global_step84877/layer_08-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dfca40120c77a80adb19b4122c07f768b7c26e94c3e2dae84093193c4f07b6c9 +size 201408771 diff --git a/8b7178b88b/global_step84877/layer_09-model_00-model_states.pt b/8b7178b88b/global_step84877/layer_09-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..696892042ac8da696e33776ab49af73dfc3acbf0 --- /dev/null +++ b/8b7178b88b/global_step84877/layer_09-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:59bbf11153e821651580e8fdf0b8721b72b143863b45f13d9d315f5b274e3819 +size 201408771 diff --git a/8b7178b88b/global_step84877/layer_09-model_01-model_states.pt b/8b7178b88b/global_step84877/layer_09-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a44dd084a86db79b731ea8430e2f1b2ffed6730c --- /dev/null +++ b/8b7178b88b/global_step84877/layer_09-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f690723227853124bb116c4b97bbef3b9e019b2aa401951a6e4a15b95a2ee3e +size 201408771 diff --git a/8b7178b88b/global_step84877/layer_10-model_00-model_states.pt b/8b7178b88b/global_step84877/layer_10-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2dea42038081294a10736069e125e222d94308b0 --- /dev/null +++ b/8b7178b88b/global_step84877/layer_10-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:63a28b8d70c17edb3a271af6e34019f4068ce1076b2e39549668db70cf7f7836 +size 201408771 diff --git a/8b7178b88b/global_step84877/layer_10-model_01-model_states.pt b/8b7178b88b/global_step84877/layer_10-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..33bba1f953966095350dbf1615128012e486aa30 --- /dev/null +++ b/8b7178b88b/global_step84877/layer_10-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d8c42e732620014e95c20d72683d368c87c12af08363efba123572ec12d4dde5 +size 201408771 diff --git a/8b7178b88b/global_step84877/layer_11-model_00-model_states.pt b/8b7178b88b/global_step84877/layer_11-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fac6ad8266a76c0d2e97344d4a58a4ccb0f837d6 --- /dev/null +++ b/8b7178b88b/global_step84877/layer_11-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a46dadd08c2ca4d819c81d58ba88673a385e352973803fff47f7ecd2cee6b24a +size 201408771 diff --git a/8b7178b88b/global_step84877/layer_11-model_01-model_states.pt b/8b7178b88b/global_step84877/layer_11-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..06fa7855dea5cc6e4f28dd4edfe5b04719228e2f --- /dev/null +++ b/8b7178b88b/global_step84877/layer_11-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d72687824d52f37c2287f0e41f4bed804f86784478efa955b1072a7257118f7d +size 201408771 diff --git a/8b7178b88b/global_step84877/layer_12-model_00-model_states.pt b/8b7178b88b/global_step84877/layer_12-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0eab0368404a9c28c911d7eabd176259891a0fca --- /dev/null +++ b/8b7178b88b/global_step84877/layer_12-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:57956fe223edc5da1d62ecf0c1eb0b11240f893d75ca5f10f0bc40258ac3b42c +size 201408771 diff --git a/8b7178b88b/global_step84877/layer_12-model_01-model_states.pt b/8b7178b88b/global_step84877/layer_12-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8fffb0e5fdd097ae4c95ad2bb40e2e2c83ce0a1e --- /dev/null +++ b/8b7178b88b/global_step84877/layer_12-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c25872b3fd7e42e674da48b88f77ca9e0f6d63c73284810e4f728181f0126414 +size 201408771 diff --git a/8b7178b88b/global_step84877/layer_13-model_00-model_states.pt b/8b7178b88b/global_step84877/layer_13-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b9ac42ef62c263dfa85859c1d0f6267fd02913ac --- /dev/null +++ b/8b7178b88b/global_step84877/layer_13-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:559d64433588a7792fc27904397082e7d8aceb4b46b6d4b9ca0a4ad1f50a8229 +size 201408771 diff --git a/8b7178b88b/global_step84877/layer_13-model_01-model_states.pt b/8b7178b88b/global_step84877/layer_13-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e3cad9564f4ba27d1630ae0c4c5d598c2e6511e7 --- /dev/null +++ b/8b7178b88b/global_step84877/layer_13-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2833ffd91dc9ebb0794c99a13c96195a9e3b17534cbf7e2f7c15a028e6384bbc +size 201408771 diff --git a/8b7178b88b/global_step84877/layer_14-model_00-model_states.pt b/8b7178b88b/global_step84877/layer_14-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..88176bd434edbcd0f5bc1f1975ecdea2ceedc12f --- /dev/null +++ b/8b7178b88b/global_step84877/layer_14-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2ad2fe44910c22d4e422ec7d07ab038e59dbda20545a1cf25c2b267044d903c +size 201408771 diff --git a/8b7178b88b/global_step84877/layer_14-model_01-model_states.pt b/8b7178b88b/global_step84877/layer_14-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ae9d78db63f75e17340964ab5f269f1efbe5037f --- /dev/null +++ b/8b7178b88b/global_step84877/layer_14-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b707c65de821cb700bba6c205f707b74f33b322c1baa02f0d9a720e324bf92e2 +size 201408771 diff --git a/8b7178b88b/global_step84877/layer_15-model_00-model_states.pt b/8b7178b88b/global_step84877/layer_15-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..86dc054c519f8bac17dad13eb9e58b1a3d1515fb --- /dev/null +++ b/8b7178b88b/global_step84877/layer_15-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e01bc4afaee38531ef0ab8932144c16c2a5c76e2613056492358f32eead7ff7c +size 201408771 diff --git a/8b7178b88b/global_step84877/layer_15-model_01-model_states.pt b/8b7178b88b/global_step84877/layer_15-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..74104438f3135d263403664387f5241699c3cb82 --- /dev/null +++ b/8b7178b88b/global_step84877/layer_15-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0dff2a510e0ede6c051206346e2e8419bc6ea901a3bd1708dc1fcc87b6b1f4d5 +size 201408771 diff --git a/8b7178b88b/global_step84877/layer_16-model_00-model_states.pt b/8b7178b88b/global_step84877/layer_16-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0341e1340691c6af853f08a953c5910e9ef6dc5d --- /dev/null +++ b/8b7178b88b/global_step84877/layer_16-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d7c664bf920a202addb7f378ab1300053f6d41daf39500ec94c15bf025f602ff +size 201408771 diff --git a/8b7178b88b/global_step84877/layer_16-model_01-model_states.pt b/8b7178b88b/global_step84877/layer_16-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..97ad2ee48d064f1ff75b7a364951d8a0af318dbb --- /dev/null +++ b/8b7178b88b/global_step84877/layer_16-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:82570bedb50a0a08284be59105fab9bf383f5d40f107bc9f66ab2cd0e4f2d2b4 +size 201408771 diff --git a/8b7178b88b/global_step84877/layer_17-model_00-model_states.pt b/8b7178b88b/global_step84877/layer_17-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5c4f3a55f880d5639dc0a65f2de74ffedae658f0 --- /dev/null +++ b/8b7178b88b/global_step84877/layer_17-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa0361e068f976ffb88d391347001678fc9925b8033af787a093502978c974e0 +size 201408771 diff --git a/8b7178b88b/global_step84877/layer_17-model_01-model_states.pt b/8b7178b88b/global_step84877/layer_17-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..01b2338a7547c22a2bb028bc6a17aedbb2e541c5 --- /dev/null +++ b/8b7178b88b/global_step84877/layer_17-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:021bb31f30251e5cd673702b81b617455ffd14718c57447270a17b3fe32afa3a +size 201408771 diff --git a/8b7178b88b/global_step84877/layer_18-model_00-model_states.pt b/8b7178b88b/global_step84877/layer_18-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..71648272b518d047b58b24cdd2026f93a1d68586 --- /dev/null +++ b/8b7178b88b/global_step84877/layer_18-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e434635bbb1a82222da7324268951da9393400e6e12e995524d9f1601a1e925 +size 201408771 diff --git a/8b7178b88b/global_step84877/layer_18-model_01-model_states.pt b/8b7178b88b/global_step84877/layer_18-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d7447ada1e71a3ad39e64de6949e6a334f22e21b --- /dev/null +++ b/8b7178b88b/global_step84877/layer_18-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4df008c0e6de468b82d796b271e0c334a7bff0917ae7aa957fcea014faf5736c +size 201408771 diff --git a/8b7178b88b/global_step84877/layer_19-model_00-model_states.pt b/8b7178b88b/global_step84877/layer_19-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d39bd3e2955700890a1c272c501d99ada085a6db --- /dev/null +++ b/8b7178b88b/global_step84877/layer_19-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0861cbccea09e500d13d729d2e7401f867a89c8d6f4f6ae67aed6da0fe5ef985 +size 201408771 diff --git a/8b7178b88b/global_step84877/layer_19-model_01-model_states.pt b/8b7178b88b/global_step84877/layer_19-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d9f6bfce4bf5475195695c25d91399c7c7b8532c --- /dev/null +++ b/8b7178b88b/global_step84877/layer_19-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a584c8cef9e7650463ac6f7393f9dead9e3a62b18fe86e15c2038056e030b079 +size 201408771 diff --git a/8b7178b88b/global_step84877/layer_20-model_00-model_states.pt b/8b7178b88b/global_step84877/layer_20-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8954c4871df3b87824baba1295f74fbf04b5786f --- /dev/null +++ b/8b7178b88b/global_step84877/layer_20-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b2976238b17dca0e743df2c58a5e16a5637494902b59f628cb5dd1358972f4bd +size 201408771 diff --git a/8b7178b88b/global_step84877/layer_20-model_01-model_states.pt b/8b7178b88b/global_step84877/layer_20-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8199ed6ee1424a5df44f2b98601311cd3b413f9c --- /dev/null +++ b/8b7178b88b/global_step84877/layer_20-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:72f5e27e06a0da47f502ee71556741721b4f3488c5924b2c35ea4bc8bf67cc09 +size 201408771 diff --git a/8b7178b88b/global_step84877/layer_21-model_00-model_states.pt b/8b7178b88b/global_step84877/layer_21-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..eec2aa8bbd7a58d9ad5854ac59762a1006316f02 --- /dev/null +++ b/8b7178b88b/global_step84877/layer_21-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:856036540d641f4f245bd456ca41981b6030cb0c42d235aa602952e85b2deb92 +size 201408771 diff --git a/8b7178b88b/global_step84877/layer_21-model_01-model_states.pt b/8b7178b88b/global_step84877/layer_21-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..09017ffd34716c023e3ff13fca52a01b964d5614 --- /dev/null +++ b/8b7178b88b/global_step84877/layer_21-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:069e007b4a3f9cd5a1a420cf9bc3987e3ab2587e10cfe769a402316237e8ab5d +size 201408771 diff --git a/8b7178b88b/global_step84877/layer_22-model_00-model_states.pt b/8b7178b88b/global_step84877/layer_22-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..44292f099a0d409855f3d7d9cbc79509f5d7f1b2 --- /dev/null +++ b/8b7178b88b/global_step84877/layer_22-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:66bf48cf98b818069c16ac71a6d519e7b84c862bd05bafec2f0f2067230b60bc +size 201408771 diff --git a/8b7178b88b/global_step84877/layer_22-model_01-model_states.pt b/8b7178b88b/global_step84877/layer_22-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d1e585649495f3c6ecb405acaf496be2f2c05987 --- /dev/null +++ b/8b7178b88b/global_step84877/layer_22-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f3668078a6800dc5845f89ddf23e2a19280860bc45ab336075ad42793f68bef +size 201408771 diff --git a/8b7178b88b/global_step84877/layer_23-model_00-model_states.pt b/8b7178b88b/global_step84877/layer_23-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a8e39a49eb8d1037dbff22979fea9454e12180b6 --- /dev/null +++ b/8b7178b88b/global_step84877/layer_23-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e78157d2966df88a449d1b918417772798ff63f37df10a4b483767a98fb76a53 +size 201408771 diff --git a/8b7178b88b/global_step84877/layer_23-model_01-model_states.pt b/8b7178b88b/global_step84877/layer_23-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2fb4324b19edfb83566eab1c0b6364837de0f67d --- /dev/null +++ b/8b7178b88b/global_step84877/layer_23-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:871d85bd80cf466565907d2485495a129a3b0d7152ed1d9f518d5674eb2bf456 +size 201408771 diff --git a/8b7178b88b/global_step84877/layer_24-model_00-model_states.pt b/8b7178b88b/global_step84877/layer_24-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fd3dd682c0876a3f7fea3c7f0441c42f4927efd8 --- /dev/null +++ b/8b7178b88b/global_step84877/layer_24-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eab217b426ad12dddd59e3704ce299b2153a74c1a241603c2b3cae8bef74cb0c +size 201408771 diff --git a/8b7178b88b/global_step84877/layer_24-model_01-model_states.pt b/8b7178b88b/global_step84877/layer_24-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e31825e9b18b1100289011b2d8ba8ee84371a9f3 --- /dev/null +++ b/8b7178b88b/global_step84877/layer_24-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:988dbf07547e4974eb457146ed5b363db0a39f539a317da1d654bbfd211eee84 +size 201408771 diff --git a/8b7178b88b/global_step84877/layer_25-model_00-model_states.pt b/8b7178b88b/global_step84877/layer_25-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8d726ca1e1f50eed15bff11e52b3c31011d1ce2d --- /dev/null +++ b/8b7178b88b/global_step84877/layer_25-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f1e757d787e30fa810eba37e9ca441b2b1796df85bbd21f431ca41ecfc3f2a5 +size 201408771 diff --git a/8b7178b88b/global_step84877/layer_25-model_01-model_states.pt b/8b7178b88b/global_step84877/layer_25-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..87cc03d290e4aca9f137e84c80c1c1c627766044 --- /dev/null +++ b/8b7178b88b/global_step84877/layer_25-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:61efc19f0ff1abd013c3c63447eadeeb9ca64909599bfe65c920de75157088bc +size 201408771 diff --git a/8b7178b88b/global_step84877/layer_26-model_00-model_states.pt b/8b7178b88b/global_step84877/layer_26-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8c63674bcef4de05ed0500117c26616f569b8df2 --- /dev/null +++ b/8b7178b88b/global_step84877/layer_26-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b24fbd6b1e098627202a951d871987ebfa1cea09ea874316c7ab20b16f6845a +size 201408771 diff --git a/8b7178b88b/global_step84877/layer_26-model_01-model_states.pt b/8b7178b88b/global_step84877/layer_26-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..344b5a1f0d54b4c52e9d1e24e9082d0fcd82ef94 --- /dev/null +++ b/8b7178b88b/global_step84877/layer_26-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e55b4dde0ae1733fe6245ace14071c03c899fcc372f4dd302aaea61ebd63e700 +size 201408771 diff --git a/8b7178b88b/global_step84877/layer_27-model_00-model_states.pt b/8b7178b88b/global_step84877/layer_27-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..286188e8a83f0265e64a87e3d97d8e4be733d43c --- /dev/null +++ b/8b7178b88b/global_step84877/layer_27-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:361668a3a0647f7d092c77d6d3673c3ade94a266898a0c4d4628852bdb38702c +size 201408771 diff --git a/8b7178b88b/global_step84877/layer_27-model_01-model_states.pt b/8b7178b88b/global_step84877/layer_27-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bfa1fbeab949354f5443db1d9e9f0986db56b7ed --- /dev/null +++ b/8b7178b88b/global_step84877/layer_27-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ba66185f619359d38e4169962f24bf71d53a019fd00667b1d357a04df7e528f +size 201408771 diff --git a/8b7178b88b/global_step84877/layer_28-model_00-model_states.pt b/8b7178b88b/global_step84877/layer_28-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..582deeff77b04921704d6f5d515b63501f847526 --- /dev/null +++ b/8b7178b88b/global_step84877/layer_28-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:454b5a9c49f4275c8080232ed77b8e92e131acc5d561cd8d403c40f75dc083f1 +size 201408771 diff --git a/8b7178b88b/global_step84877/layer_28-model_01-model_states.pt b/8b7178b88b/global_step84877/layer_28-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..418e7f191a71a0cfad3a1dd96ede867af1712888 --- /dev/null +++ b/8b7178b88b/global_step84877/layer_28-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:86414bb572600d063b4c76c46acd9c3dfab9d594d3004da570f75dcdd90e6e70 +size 201408771 diff --git a/8b7178b88b/global_step84877/layer_29-model_00-model_states.pt b/8b7178b88b/global_step84877/layer_29-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2e5caf4e84b14d4772f727dfaccdf25c08695adf --- /dev/null +++ b/8b7178b88b/global_step84877/layer_29-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9113a770b5c3d76fa464f7398feeec108e7fe187e0c472632218da0dbd1db513 +size 201408771 diff --git a/8b7178b88b/global_step84877/layer_29-model_01-model_states.pt b/8b7178b88b/global_step84877/layer_29-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fad41ec0fb2be224a01472f655896fec358a3e6f --- /dev/null +++ b/8b7178b88b/global_step84877/layer_29-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8d43d9d12596e9ea3c0cdfa408cea525e28f6fd8ebd854925ac5f80ccca31fe +size 201408771 diff --git a/8b7178b88b/global_step84877/layer_30-model_00-model_states.pt b/8b7178b88b/global_step84877/layer_30-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b6acd76365254b1bd62f654bd84bc8be0e127eae --- /dev/null +++ b/8b7178b88b/global_step84877/layer_30-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3cbf7ba261d6132b6b5d872711071e89333868d55759e69f980ac4617b598e4b +size 201408771 diff --git a/8b7178b88b/global_step84877/layer_30-model_01-model_states.pt b/8b7178b88b/global_step84877/layer_30-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ea553ea19dab107d7bd4865c042bee6a85b87987 --- /dev/null +++ b/8b7178b88b/global_step84877/layer_30-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a2286a327676838ca9cab6212189e87ce04deeca2bb48b14ba2905acf612fb2 +size 201408771 diff --git a/8b7178b88b/global_step84877/layer_31-model_00-model_states.pt b/8b7178b88b/global_step84877/layer_31-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7ae45d244d2baf4387a229ef79a51f432b19f8dd --- /dev/null +++ b/8b7178b88b/global_step84877/layer_31-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1dbbe891546bd94128ca5f873429e709c08461ec379b48d86be9e12c6a08d606 +size 201408771 diff --git a/8b7178b88b/global_step84877/layer_31-model_01-model_states.pt b/8b7178b88b/global_step84877/layer_31-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..480329f280c260aff152fb012fe5af540a0883bc --- /dev/null +++ b/8b7178b88b/global_step84877/layer_31-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:59edb4b6e0a8b4331c57aec3dc8d69c92390f114809a840c586221acf40cc52b +size 201408771 diff --git a/8b7178b88b/global_step84877/layer_32-model_00-model_states.pt b/8b7178b88b/global_step84877/layer_32-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..91445e2279397befcc62b08f6161048e226e57c9 --- /dev/null +++ b/8b7178b88b/global_step84877/layer_32-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d7a3102b88dc7f38c7935a1497c23d64294150c9d31bb6b1ce1bf554acadb585 +size 201408771 diff --git a/8b7178b88b/global_step84877/layer_32-model_01-model_states.pt b/8b7178b88b/global_step84877/layer_32-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5ce30b063b5a41b8a255a18739e3318bc1d111f0 --- /dev/null +++ b/8b7178b88b/global_step84877/layer_32-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f96ec75df8a6d92cb88d7e974b0e3e4ab8bbcaf66ec2744b4a31477425c55936 +size 201408771 diff --git a/8b7178b88b/global_step84877/layer_33-model_00-model_states.pt b/8b7178b88b/global_step84877/layer_33-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..31d36895074bc375813cce75bbe3d6431ca48f2c --- /dev/null +++ b/8b7178b88b/global_step84877/layer_33-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:428ae30b2ce1daf1bbe19f30e6655ff8d283e3bffd9abc48095a609d4550c64e +size 201408771 diff --git a/8b7178b88b/global_step84877/layer_33-model_01-model_states.pt b/8b7178b88b/global_step84877/layer_33-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..77e6ebef0a063ae825f547de13220dcfc76ad2b4 --- /dev/null +++ b/8b7178b88b/global_step84877/layer_33-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b1d588f5132bb6ec7041630b9b5791a4086efd34522149643fd596b81fa133de +size 201408771 diff --git a/8b7178b88b/global_step84877/layer_34-model_00-model_states.pt b/8b7178b88b/global_step84877/layer_34-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8111893abf4bcd8fc0fa8c0f2ffd79eb257d461f --- /dev/null +++ b/8b7178b88b/global_step84877/layer_34-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd4d0640e1156b59cbfe2270f23c837ea3f436b732842a6be4efa630e856a3c7 +size 201408771 diff --git a/8b7178b88b/global_step84877/layer_34-model_01-model_states.pt b/8b7178b88b/global_step84877/layer_34-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e438f874127bd62366120c5afa704e0ce579981d --- /dev/null +++ b/8b7178b88b/global_step84877/layer_34-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1fc95d2e17587402e99195ec4571dbe1bce976380027864572acbdb4fbc2ecab +size 201408771 diff --git a/8b7178b88b/global_step84877/layer_35-model_00-model_states.pt b/8b7178b88b/global_step84877/layer_35-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ded2a1e67430375685377f5f35f4c05661fadfce --- /dev/null +++ b/8b7178b88b/global_step84877/layer_35-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca092d0bb3f7bf127973f67358fbbca6921f0322daca5b9d790027e272222655 +size 201408771 diff --git a/8b7178b88b/global_step84877/layer_35-model_01-model_states.pt b/8b7178b88b/global_step84877/layer_35-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d03d7816e323249ac91d8f716bcdec16524471e6 --- /dev/null +++ b/8b7178b88b/global_step84877/layer_35-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9fd7289f8ab66a80288efad0f5cd0d0328d00b72fb4689561d65bc03662da760 +size 201408771 diff --git a/8b7178b88b/global_step84877/layer_36-model_00-model_states.pt b/8b7178b88b/global_step84877/layer_36-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4f7feb799c2d0cd06762e100f4eb5b063e63a983 --- /dev/null +++ b/8b7178b88b/global_step84877/layer_36-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:78ea2ef65a91d8e7ba3a514b50af7782d16e3149e249e15574157189c2d9b6d0 +size 201408771 diff --git a/8b7178b88b/global_step84877/layer_36-model_01-model_states.pt b/8b7178b88b/global_step84877/layer_36-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fa81dbbfad31c5f1d06a341af3219799031bc80b --- /dev/null +++ b/8b7178b88b/global_step84877/layer_36-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f6e9aa8cf4706b0af36489724da614bdf2f9a97bc01cc62452ba3d925e9f9308 +size 201408771 diff --git a/8b7178b88b/global_step84877/layer_37-model_00-model_states.pt b/8b7178b88b/global_step84877/layer_37-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..475d338bd749324ee50e9908bf43e3d1d2731f8b --- /dev/null +++ b/8b7178b88b/global_step84877/layer_37-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6a2ced820007f1b03834c2b1ff99d285b456874506d96e8e64061b0475fcc9a0 +size 201408771 diff --git a/8b7178b88b/global_step84877/layer_37-model_01-model_states.pt b/8b7178b88b/global_step84877/layer_37-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..41e915a8bc0debc79c2af776f98197cc1d3c754b --- /dev/null +++ b/8b7178b88b/global_step84877/layer_37-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1176611e1743a7eb391845565d8a1c0795077daedd402873055f12c255fc238c +size 201408771 diff --git a/8b7178b88b/global_step84877/layer_38-model_00-model_states.pt b/8b7178b88b/global_step84877/layer_38-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7fe7330890a4969179bb99a046a56f5c5be28f68 --- /dev/null +++ b/8b7178b88b/global_step84877/layer_38-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f0a6669b7f68bee93c3a7240ba05102c62ecc59d46fcdbd72089d9aed56c086 +size 201408771 diff --git a/8b7178b88b/global_step84877/layer_38-model_01-model_states.pt b/8b7178b88b/global_step84877/layer_38-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6304d8a5a27501c8ae805d2cad2b126576e3d548 --- /dev/null +++ b/8b7178b88b/global_step84877/layer_38-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec69a5e4fcaa2555ef09fcb951ba066cd57a6fe1135c031f63d9853c9b87bc62 +size 201408771 diff --git a/8b7178b88b/global_step84877/layer_39-model_00-model_states.pt b/8b7178b88b/global_step84877/layer_39-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..750227d6cdba8f868d86d283877feb290fcdbc76 --- /dev/null +++ b/8b7178b88b/global_step84877/layer_39-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e56cfb8ebd7efe79beb8097813546e424f607f2a6d158affcfff7fb19a2a1798 +size 201408771 diff --git a/8b7178b88b/global_step84877/layer_39-model_01-model_states.pt b/8b7178b88b/global_step84877/layer_39-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c67b6aaf9e211962f69fbe1309c2f605d2f20d8d --- /dev/null +++ b/8b7178b88b/global_step84877/layer_39-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d69cc99400d478c56a482161b7cb7ff935468431acd960ade4024f5a4ab4e3a +size 201408771 diff --git a/8b7178b88b/global_step84877/layer_40-model_00-model_states.pt b/8b7178b88b/global_step84877/layer_40-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..00d1562c846f11a7f40ec89197f9b6f2aed6588d --- /dev/null +++ b/8b7178b88b/global_step84877/layer_40-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:beebbce3f357ef653fc2d5732bd37c8d33c00c03f6d23736b90254ce603586b4 +size 201408771 diff --git a/8b7178b88b/global_step84877/layer_40-model_01-model_states.pt b/8b7178b88b/global_step84877/layer_40-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..42384c9750f2cb7173b14cb1db783caf293912cc --- /dev/null +++ b/8b7178b88b/global_step84877/layer_40-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74b5d804a5ae23b09b1e21ac40030207ebf467c3fd2cbc96309859937081a4ca +size 201408771 diff --git a/8b7178b88b/global_step84877/layer_41-model_00-model_states.pt b/8b7178b88b/global_step84877/layer_41-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..61af31b88d994a5ba20dbca8a33d9e018aa82bb5 --- /dev/null +++ b/8b7178b88b/global_step84877/layer_41-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:43c8220fadb3bfa5c403544181fd17863860afc023c75b5d6a63e4d5894bbdb6 +size 201408771 diff --git a/8b7178b88b/global_step84877/layer_41-model_01-model_states.pt b/8b7178b88b/global_step84877/layer_41-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2e2c6d2484d70e6c5a96bbcadf7cc51f138f4fb4 --- /dev/null +++ b/8b7178b88b/global_step84877/layer_41-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8085866712b79fa536825799dfef2cb62e3c54280223deeac16f664b78d1122e +size 201408771 diff --git a/8b7178b88b/global_step84877/layer_42-model_00-model_states.pt b/8b7178b88b/global_step84877/layer_42-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5e07bb9a81fea9c755f41801b865beca7aafe232 --- /dev/null +++ b/8b7178b88b/global_step84877/layer_42-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:443c7409e01ef4467e3fe7c363ad4af6eab5ca8508db9cb6d4c997f05e9cd2b5 +size 201408771 diff --git a/8b7178b88b/global_step84877/layer_42-model_01-model_states.pt b/8b7178b88b/global_step84877/layer_42-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4199b7f34bf9f80bae5bc8ee7ab669e844dadbdd --- /dev/null +++ b/8b7178b88b/global_step84877/layer_42-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc630755d0999b46a034ce9071038b87baba2c801a11e6ae12644184789c9350 +size 201408771 diff --git a/8b7178b88b/global_step84877/layer_43-model_00-model_states.pt b/8b7178b88b/global_step84877/layer_43-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..98058d8f389e48bd8b6420a2f579819aceba787f --- /dev/null +++ b/8b7178b88b/global_step84877/layer_43-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58e441b427e91ff989cf48771b0b0395a5bc27e22e346b55b98c4272191bafa3 +size 201408771 diff --git a/8b7178b88b/global_step84877/layer_43-model_01-model_states.pt b/8b7178b88b/global_step84877/layer_43-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5e8f8d60bb6caec6d508504fa3e1055477ac9e38 --- /dev/null +++ b/8b7178b88b/global_step84877/layer_43-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f7b65cf1706bc5070bfc7363f240ecff4719c306f85c5e042f4de760e76c4dd +size 201408771 diff --git a/8b7178b88b/global_step84877/layer_44-model_00-model_states.pt b/8b7178b88b/global_step84877/layer_44-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..df9e8cda144994976757b137872a4e3fd82bd55f --- /dev/null +++ b/8b7178b88b/global_step84877/layer_44-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa5919e38d03e9794def85ae8569244b4572bced0b1510c6a7943863556f7170 +size 201408771 diff --git a/8b7178b88b/global_step84877/layer_44-model_01-model_states.pt b/8b7178b88b/global_step84877/layer_44-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..de47c61b593ec8b56fdc1a3e646d7ebabb5cfb08 --- /dev/null +++ b/8b7178b88b/global_step84877/layer_44-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:93aee116f8b36dbc940b75f4255ef07967caf75b8b4745bb70b7a309de019d77 +size 201408771 diff --git a/8b7178b88b/global_step84877/layer_46-model_00-model_states.pt b/8b7178b88b/global_step84877/layer_46-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b5c56cff97d17a2a3d1efda9196146176262a854 --- /dev/null +++ b/8b7178b88b/global_step84877/layer_46-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8682397f9eb74d2d2780f7cdbc4c1a53ee4553a1e0f870502f3d29477884286a +size 17603 diff --git a/8b7178b88b/global_step84877/layer_46-model_01-model_states.pt b/8b7178b88b/global_step84877/layer_46-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e588511802cc34dda79ecd53647758eedd310dad --- /dev/null +++ b/8b7178b88b/global_step84877/layer_46-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:346762d4c6aa1b16ca14c01d41bd10a8d4e9816df99df4a39dfae95645fe4b48 +size 17603 diff --git a/8b7178b88b/global_step84877/mp_rank_00_model_states.pt b/8b7178b88b/global_step84877/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0885013cf8c56c6351be59ef5936a2650f5b6e61 --- /dev/null +++ b/8b7178b88b/global_step84877/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35980d4299231f4e15b895061702240fea986debc5aa7e0679be5ea1895ae475 +size 40115 diff --git a/8b7178b88b/global_step84877/mp_rank_01_model_states.pt b/8b7178b88b/global_step84877/mp_rank_01_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3f4ee630dbde6015cc6b0687a1b6a10126b08a89 --- /dev/null +++ b/8b7178b88b/global_step84877/mp_rank_01_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8dbbbadea00efc625664179ed3caf988bd7bd0ed79007ebafb07c3f74f8e769 +size 40115 diff --git a/8b7178b88b/global_step84877/mp_rank_02_model_states.pt b/8b7178b88b/global_step84877/mp_rank_02_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5226d6e7e9c81c7aa87fffde2539a7722bbad3f4 --- /dev/null +++ b/8b7178b88b/global_step84877/mp_rank_02_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f4e079248f47489f2ee2e06564311aa93a072188e9e28f31327c34aa75e727f8 +size 40243 diff --git a/8b7178b88b/global_step84877/mp_rank_03_model_states.pt b/8b7178b88b/global_step84877/mp_rank_03_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..18591a0de07a1738b6f59d93d06d0cd80ff12bc6 --- /dev/null +++ b/8b7178b88b/global_step84877/mp_rank_03_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:83b430e9fa85737757f859269dd2028df58ce23f7a7442769cdd05117c28bdd3 +size 40243 diff --git a/8b7178b88b/transformers/config.json b/8b7178b88b/transformers/config.json new file mode 100644 index 0000000000000000000000000000000000000000..eadf3eb13cecae9db1c34cde4f4d373a9d0fe00f --- /dev/null +++ b/8b7178b88b/transformers/config.json @@ -0,0 +1 @@ +{"vocab_size": 50432, "n_positions": 2048, "n_embd": 4096, "n_layer": 42, "n_head": 32, "n_inner": 16384, "activation_function": "gelu", "resid_pdrop": 0.1, "embd_pdrop": 0.1, "attn_pdrop": 0.1, "layer_norm_epsilon": 1e-05, "initializer_range": 0.02, "summary_type": "cls_index", "summary_use_proj": true, "summary_activation": null, "summary_first_dropout": 0.1, "summary_proj_to_labels": true, "scale_attn_weights": true, "use_cache": true, "scale_attn_by_inverse_layer_idx": false, "reorder_and_upcast_attn": false, "bos_token_id": 50256, "eos_token_id": 50256, "return_dict": true, "output_hidden_states": false, "output_attentions": false, "torchscript": false, "torch_dtype": null, "use_bfloat16": false, "tf_legacy_loss": false, "pruned_heads": {}, "tie_word_embeddings": true, "is_encoder_decoder": false, "is_decoder": false, "cross_attention_hidden_size": null, "add_cross_attention": false, "tie_encoder_decoder": false, "max_length": 20, "min_length": 0, "do_sample": false, "early_stopping": false, "num_beams": 1, "num_beam_groups": 1, "diversity_penalty": 0.0, "temperature": 1.0, "top_k": 50, "top_p": 1.0, "typical_p": 1.0, "repetition_penalty": 1.0, "length_penalty": 1.0, "no_repeat_ngram_size": 0, "encoder_no_repeat_ngram_size": 0, "bad_words_ids": null, "num_return_sequences": 1, "chunk_size_feed_forward": 0, "output_scores": false, "return_dict_in_generate": false, "forced_bos_token_id": null, "forced_eos_token_id": null, "remove_invalid_values": false, "exponential_decay_length_penalty": null, "suppress_tokens": null, "begin_suppress_tokens": null, "architectures": ["GPT2LMHeadModel"], "finetuning_task": null, "id2label": {"0": "LABEL_0", "1": "LABEL_1"}, "label2id": {"LABEL_0": 0, "LABEL_1": 1}, "tokenizer_class": null, "prefix": null, "pad_token_id": null, "sep_token_id": null, "decoder_start_token_id": null, "task_specific_params": null, "problem_type": null, "_name_or_path": "", "transformers_version": "4.25.0.dev0", "n_ctx": 1024, "gradient_checkpointing": false, "model_type": "gpt2"} \ No newline at end of file diff --git a/8b7178b88b/transformers/pytorch_model.bin b/8b7178b88b/transformers/pytorch_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..eb3971a427d8fff99bbd7b241e3adf6f54a70f51 --- /dev/null +++ b/8b7178b88b/transformers/pytorch_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a765505f0c0a6133fb8c17345d1356ec2aa35b709dfc98378fdb7a37b47f4344 +size 17698351197 diff --git a/launch.sh b/launch.sh new file mode 100755 index 0000000000000000000000000000000000000000..6c3445845a5dae614feb4b8a1206322cd7bd9050 --- /dev/null +++ b/launch.sh @@ -0,0 +1,53 @@ +#!/bin/bash + +# Launch script using torch.distributed.run(). Used by slurm +# scripts, don't invoke directly. + +# Samuel's fix for apparent error in SLURM initialization +if [ $SLURM_LOCALID -eq 0 ]; then + rm -rf /dev/shm/* + rocm-smi || true +else + sleep 2 +fi + +export NCCL_SOCKET_IFNAME=hsn0,hsn1,hsn2,hsn3 +export OMP_NUM_THREADS=$SLURM_CPUS_PER_TASK +export FI_CXI_DEFAULT_CQ_SIZE=131072 + +# debugging (noisy) +#export NCCL_DEBUG=INFO +#export RCCL_KERNEL_COLL_TRACE_ENABLE=1 +#export NCCL_DEBUG_SUBSYS=INIT,COLL + +module --quiet purge +module load cray-python + +module load CrayEnv +module load PrgEnv-cray/8.3.3 +module load craype-accel-amd-gfx90a +module load cray-python + +module use /pfs/lustrep2/projappl/project_462000125/samantao-public/mymodules +module load suse-repo-deps/sam-default +module load rocm/sam-5.2.3.lua +module load rccl/sam-develop.lua +module load aws-ofi-rccl/sam-default.lua + +source venv/bin/activate + +MASTER_NODE=$(scontrol show hostnames "$SLURM_JOB_NODELIST" | head -n 1) +MASTER_PORT=9999 + +echo "Launching on $SLURMD_NODENAME ($SLURM_PROCID/$SLURM_JOB_NUM_NODES)," \ + "master $MASTER_NODE port $MASTER_PORT," \ + "GPUs $SLURM_GPUS_ON_NODE," \ + "CUDA: $(python -c 'import torch; print(torch.cuda.is_available())')" + +python -u -m torch.distributed.run \ + --nnodes $SLURM_JOB_NUM_NODES \ + --nproc_per_node $SLURM_GPUS_ON_NODE \ + --node_rank=$SLURM_PROCID \ + --master_addr $MASTER_NODE \ + --master_port $MASTER_PORT \ + "$@" diff --git a/tensorboard/tensorboard_8b7178b44boscar/events.out.tfevents.1674203794.nid006729.92782.0 b/tensorboard/tensorboard_8b7178b44boscar/events.out.tfevents.1674203794.nid006729.92782.0 new file mode 100644 index 0000000000000000000000000000000000000000..93819f2844ed16b05409305935a51e244e0d53ea --- /dev/null +++ b/tensorboard/tensorboard_8b7178b44boscar/events.out.tfevents.1674203794.nid006729.92782.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5bacf5eed23c12da8ccbebccbbf80c0fcdd6281c5f2ec226036f97e60571c0c9 +size 40 diff --git a/tensorboard/tensorboard_8b7178b44boscar/events.out.tfevents.1674206058.nid007225.128328.0 b/tensorboard/tensorboard_8b7178b44boscar/events.out.tfevents.1674206058.nid007225.128328.0 new file mode 100644 index 0000000000000000000000000000000000000000..e2777de696c12b6e18eaf488c5204f1265e0f0e8 --- /dev/null +++ b/tensorboard/tensorboard_8b7178b44boscar/events.out.tfevents.1674206058.nid007225.128328.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf5e9b8933b6f3271c80d002d87f3a75db1292a5b44e44926be729a1d8d4b5d0 +size 40 diff --git a/tensorboard/tensorboard_8b7178b44boscar/events.out.tfevents.1674206530.nid006729.113668.0 b/tensorboard/tensorboard_8b7178b44boscar/events.out.tfevents.1674206530.nid006729.113668.0 new file mode 100644 index 0000000000000000000000000000000000000000..7c20c78ff41b723deeec2e185161cac7e1f04c6b --- /dev/null +++ b/tensorboard/tensorboard_8b7178b44boscar/events.out.tfevents.1674206530.nid006729.113668.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:616d893113fe53e1b6867bd91e95d3aa1fe35bda3e4a02afa70fedcc871a360a +size 40 diff --git a/tensorboard/tensorboard_8b7178b44boscar/events.out.tfevents.1674208882.nid006729.2134.0 b/tensorboard/tensorboard_8b7178b44boscar/events.out.tfevents.1674208882.nid006729.2134.0 new file mode 100644 index 0000000000000000000000000000000000000000..e6f73ba357d6a0e290df1b1304c1eef732f5bc68 --- /dev/null +++ b/tensorboard/tensorboard_8b7178b44boscar/events.out.tfevents.1674208882.nid006729.2134.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23f231af7e285c0c5f4bbe8ebb9176ac197f6b61d3bfcd4fdc884afb99187019 +size 40 diff --git a/tensorboard/tensorboard_8b7178b44boscar/events.out.tfevents.1674211218.nid007225.28612.0 b/tensorboard/tensorboard_8b7178b44boscar/events.out.tfevents.1674211218.nid007225.28612.0 new file mode 100644 index 0000000000000000000000000000000000000000..decf34d02b73fcf160a187c295b40497c058b967 --- /dev/null +++ b/tensorboard/tensorboard_8b7178b44boscar/events.out.tfevents.1674211218.nid007225.28612.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:736afcaa0967c993f784c8f4bc4c37e25159f8b5513964a944e929a4b60d33ae +size 51168759 diff --git a/tensorboard/tensorboard_8b7178b44boscar/events.out.tfevents.1674383961.nid006751.102299.0 b/tensorboard/tensorboard_8b7178b44boscar/events.out.tfevents.1674383961.nid006751.102299.0 new file mode 100644 index 0000000000000000000000000000000000000000..78368f2defb56b18df393d23cd2ca289c689d99c --- /dev/null +++ b/tensorboard/tensorboard_8b7178b44boscar/events.out.tfevents.1674383961.nid006751.102299.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:741b03719ef32f41a5d641500d960f1859a47716ffd53e9686366c0395aa1829 +size 56297746 diff --git a/tensorboard/tensorboard_8b7178b44boscar/events.out.tfevents.1674556861.nid006751.116605.0 b/tensorboard/tensorboard_8b7178b44boscar/events.out.tfevents.1674556861.nid006751.116605.0 new file mode 100644 index 0000000000000000000000000000000000000000..fad2861a9038690b7a57b09d2f494198f5d534a3 --- /dev/null +++ b/tensorboard/tensorboard_8b7178b44boscar/events.out.tfevents.1674556861.nid006751.116605.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a5bea97d9f5b47649783512a5fcc29bf9fa2d1c018f685d39f7f9e0cae252eb +size 40 diff --git a/tensorboard/tensorboard_8b7178b44boscar/events.out.tfevents.1674634575.nid007011.29628.0 b/tensorboard/tensorboard_8b7178b44boscar/events.out.tfevents.1674634575.nid007011.29628.0 new file mode 100644 index 0000000000000000000000000000000000000000..58d71df8f990f5df5811ddf33739888ec8300eb8 --- /dev/null +++ b/tensorboard/tensorboard_8b7178b44boscar/events.out.tfevents.1674634575.nid007011.29628.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca477cbdb08b6875c5a6d2fde782039df9f1c0bb8d54fac2fa47793d8b3577b8 +size 21011036 diff --git a/tensorboard/tensorboard_8b7178b44boscar/events.out.tfevents.1674910929.nid007239.64489.0 b/tensorboard/tensorboard_8b7178b44boscar/events.out.tfevents.1674910929.nid007239.64489.0 new file mode 100644 index 0000000000000000000000000000000000000000..fd690bcb61e46594879de2570d85727040d40f56 --- /dev/null +++ b/tensorboard/tensorboard_8b7178b44boscar/events.out.tfevents.1674910929.nid007239.64489.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:29af0f9524165eae4c0c67861c8ab2c9a09eeb2a5f5fc061c13d2d5d093a9ab0 +size 40 diff --git a/tensorboard/tensorboard_8b7178b44boscar/events.out.tfevents.1674911527.nid007187.101727.0 b/tensorboard/tensorboard_8b7178b44boscar/events.out.tfevents.1674911527.nid007187.101727.0 new file mode 100644 index 0000000000000000000000000000000000000000..2491eaa035a652adc6c5139422ac9e3fdb1691f7 --- /dev/null +++ b/tensorboard/tensorboard_8b7178b44boscar/events.out.tfevents.1674911527.nid007187.101727.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20efe046a9d1b95188e020b5b4e868e6a10893f6573458270b95fbdbdec61bb5 +size 19366747 diff --git a/tensorboard/tensorboard_8b7178b44boscar/events.out.tfevents.1674973159.nid005175.1867.0 b/tensorboard/tensorboard_8b7178b44boscar/events.out.tfevents.1674973159.nid005175.1867.0 new file mode 100644 index 0000000000000000000000000000000000000000..975b1894f6f5bdd91242976e3cc87eaf018aa7bd --- /dev/null +++ b/tensorboard/tensorboard_8b7178b44boscar/events.out.tfevents.1674973159.nid005175.1867.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b1306857efaa6e0ec9252eeae8ccfa01550471c7c1aeb1d5e8b4ff1821851c2 +size 17790459 diff --git a/tensorboard/tensorboard_8b7178b44boscar/events.out.tfevents.1675029058.nid005411.15811.0 b/tensorboard/tensorboard_8b7178b44boscar/events.out.tfevents.1675029058.nid005411.15811.0 new file mode 100644 index 0000000000000000000000000000000000000000..8443168b5bce49617691c7810f463e4d2d02f7aa --- /dev/null +++ b/tensorboard/tensorboard_8b7178b44boscar/events.out.tfevents.1675029058.nid005411.15811.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:57285871befb28fa2f3eb1d9ad37d42c7b01e1d7fb16375638bc552d44d9d10d +size 40 diff --git a/tensorboard/tensorboard_8b7178b44boscar/events.out.tfevents.1675031498.nid005411.33942.0 b/tensorboard/tensorboard_8b7178b44boscar/events.out.tfevents.1675031498.nid005411.33942.0 new file mode 100644 index 0000000000000000000000000000000000000000..0091eab60fc98bf3a02460b5aa41ac7ab932c2c1 --- /dev/null +++ b/tensorboard/tensorboard_8b7178b44boscar/events.out.tfevents.1675031498.nid005411.33942.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4efff15783cb3574253d82343ee8953b9bf6672be211c2f7571fc7afea27a855 +size 40 diff --git a/tensorboard/tensorboard_8b7178b44boscar/events.out.tfevents.1675103508.nid006891.100846.0 b/tensorboard/tensorboard_8b7178b44boscar/events.out.tfevents.1675103508.nid006891.100846.0 new file mode 100644 index 0000000000000000000000000000000000000000..e133618226465c4aff4ee4cb15fe2db6b98cacc9 --- /dev/null +++ b/tensorboard/tensorboard_8b7178b44boscar/events.out.tfevents.1675103508.nid006891.100846.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:01d8ecc7a1c79c1e1977e70c985ef061a398b8c43959915dc80bf09c6a85378b +size 40 diff --git a/tensorboard/tensorboard_8b7178b44boscar/events.out.tfevents.1675106604.nid006537.25900.0 b/tensorboard/tensorboard_8b7178b44boscar/events.out.tfevents.1675106604.nid006537.25900.0 new file mode 100644 index 0000000000000000000000000000000000000000..efb7e898da6e5c1e4e56f7b9da763c877d8a8280 --- /dev/null +++ b/tensorboard/tensorboard_8b7178b44boscar/events.out.tfevents.1675106604.nid006537.25900.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4be66697250ac099f4fdf2a0c0725ef8e7ad178862cdd2eecdf461ef5dd65ef6 +size 40 diff --git a/tensorboard/tensorboard_8b7178b44boscar/events.out.tfevents.1675106825.nid006315.82648.0 b/tensorboard/tensorboard_8b7178b44boscar/events.out.tfevents.1675106825.nid006315.82648.0 new file mode 100644 index 0000000000000000000000000000000000000000..1d90df32f1f13f5abc98f63aaa285c41b0e4ef1e --- /dev/null +++ b/tensorboard/tensorboard_8b7178b44boscar/events.out.tfevents.1675106825.nid006315.82648.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad31e898929de631549c4d0fb841777ed51d8001dc0ec0c018903213e5137576 +size 40 diff --git a/tensorboard/tensorboard_8b7178b44boscar/events.out.tfevents.1675106999.nid005895.95108.0 b/tensorboard/tensorboard_8b7178b44boscar/events.out.tfevents.1675106999.nid005895.95108.0 new file mode 100644 index 0000000000000000000000000000000000000000..bb52ad917a2a950e3610ad4737a1dc971bf9dee4 --- /dev/null +++ b/tensorboard/tensorboard_8b7178b44boscar/events.out.tfevents.1675106999.nid005895.95108.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b9adf6814ec47ae917a821aec95b280b8eccaec0333a74f7f7a8e5bef037f70 +size 40 diff --git a/tensorboard/tensorboard_8b7178b44boscar/events.out.tfevents.1675107149.nid006751.78763.0 b/tensorboard/tensorboard_8b7178b44boscar/events.out.tfevents.1675107149.nid006751.78763.0 new file mode 100644 index 0000000000000000000000000000000000000000..21a22273d4409ea6056ac4c7020a8aba5abaf884 --- /dev/null +++ b/tensorboard/tensorboard_8b7178b44boscar/events.out.tfevents.1675107149.nid006751.78763.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9413d870d388d36af10ff53d43f281e893f7bd59dd0deb79e911d4b0460ab586 +size 40 diff --git a/tensorboard/tensorboard_8b7178b44boscar/events.out.tfevents.1675107398.nid006751.85117.0 b/tensorboard/tensorboard_8b7178b44boscar/events.out.tfevents.1675107398.nid006751.85117.0 new file mode 100644 index 0000000000000000000000000000000000000000..a50c577264d2b58d61a200beafb07019177ef952 --- /dev/null +++ b/tensorboard/tensorboard_8b7178b44boscar/events.out.tfevents.1675107398.nid006751.85117.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:023e07735f562cb2ef8e716927ed65cb4478805ee2ab0702d5b450e28ffa6eb0 +size 40 diff --git a/tensorboard/tensorboard_8b7178b88boscar/events.out.tfevents.1674380796.nid007183.117296.0 b/tensorboard/tensorboard_8b7178b88boscar/events.out.tfevents.1674380796.nid007183.117296.0 new file mode 100644 index 0000000000000000000000000000000000000000..c8b2b132d018c790a5b1e0aa0884ccb173b026db --- /dev/null +++ b/tensorboard/tensorboard_8b7178b88boscar/events.out.tfevents.1674380796.nid007183.117296.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:48e955f721b36212a37bec33a1e1a13d25af13fb611ea5c478796bd03dd73f11 +size 15540422 diff --git a/tensorboard/tensorboard_8b7178b88boscar/events.out.tfevents.1674439096.nid006481.105402.0 b/tensorboard/tensorboard_8b7178b88boscar/events.out.tfevents.1674439096.nid006481.105402.0 new file mode 100644 index 0000000000000000000000000000000000000000..d4c1836f0d39cfe67811b300583842fa65abe4cb --- /dev/null +++ b/tensorboard/tensorboard_8b7178b88boscar/events.out.tfevents.1674439096.nid006481.105402.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:764d7ad376bbb7aa33d70ba6daed16c36dab6c7e517cc964151bd7691f39476f +size 40 diff --git a/tensorboard/tensorboard_8b7178b88boscar/events.out.tfevents.1674441446.nid007183.63440.0 b/tensorboard/tensorboard_8b7178b88boscar/events.out.tfevents.1674441446.nid007183.63440.0 new file mode 100644 index 0000000000000000000000000000000000000000..e64b5458f7a9e2fea65750de98892f0419a38413 --- /dev/null +++ b/tensorboard/tensorboard_8b7178b88boscar/events.out.tfevents.1674441446.nid007183.63440.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7e6bec4745a38840f18cf2b2bf438da944f3e2cc0e5fcb0b34d5985d6a93eb0 +size 40 diff --git a/tensorboard/tensorboard_8b7178b88boscar/events.out.tfevents.1674443805.nid006579.52071.0 b/tensorboard/tensorboard_8b7178b88boscar/events.out.tfevents.1674443805.nid006579.52071.0 new file mode 100644 index 0000000000000000000000000000000000000000..44c4d4914d8f024622a1d807ad2791b7582377da --- /dev/null +++ b/tensorboard/tensorboard_8b7178b88boscar/events.out.tfevents.1674443805.nid006579.52071.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc5ab66d940ea47331659154965b7a44f5cda21995db252cdc0a1858de59cac9 +size 3273287 diff --git a/tensorboard/tensorboard_8b7178b88boscar/events.out.tfevents.1674455096.nid006533.33147.0 b/tensorboard/tensorboard_8b7178b88boscar/events.out.tfevents.1674455096.nid006533.33147.0 new file mode 100644 index 0000000000000000000000000000000000000000..b42371089f581c96a02d68c1f39d0110064ebb72 --- /dev/null +++ b/tensorboard/tensorboard_8b7178b88boscar/events.out.tfevents.1674455096.nid006533.33147.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:847d2f459eddef5dbd649a71afb72106e14d81d406a87ef79db93e1fe41471a0 +size 56001039 diff --git a/tensorboard/tensorboard_8b7178b88boscar/events.out.tfevents.1674627909.nid006885.49592.0 b/tensorboard/tensorboard_8b7178b88boscar/events.out.tfevents.1674627909.nid006885.49592.0 new file mode 100644 index 0000000000000000000000000000000000000000..96c2308e4225e26df37816c6f2ec3dc449178ef1 --- /dev/null +++ b/tensorboard/tensorboard_8b7178b88boscar/events.out.tfevents.1674627909.nid006885.49592.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:45a1e7e1d8cc794d871989c7f7972c33a7c05d0f97525006ae53c80aa8ce6848 +size 40 diff --git a/tensorboard/tensorboard_8b7178b88boscar/events.out.tfevents.1674628514.nid005873.80339.0 b/tensorboard/tensorboard_8b7178b88boscar/events.out.tfevents.1674628514.nid005873.80339.0 new file mode 100644 index 0000000000000000000000000000000000000000..08564bdcfc01451cb6da08cbea31108e2b6a23c9 --- /dev/null +++ b/tensorboard/tensorboard_8b7178b88boscar/events.out.tfevents.1674628514.nid005873.80339.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c146be7fabd34488e07285551fa47379be84e3d9c034ca43d72cf0789355b3e5 +size 34081817 diff --git a/tensorboard/tensorboard_8b7178b88boscar/events.out.tfevents.1674801355.nid005522.120370.0 b/tensorboard/tensorboard_8b7178b88boscar/events.out.tfevents.1674801355.nid005522.120370.0 new file mode 100644 index 0000000000000000000000000000000000000000..6be7e8f8b1a6fa014836bba02be837d91eed3fed --- /dev/null +++ b/tensorboard/tensorboard_8b7178b88boscar/events.out.tfevents.1674801355.nid005522.120370.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:85580d1e8efe5e1289f44bbbf7346d3b51a6bc4d071fd716a11a5b8adce8aa87 +size 56173394 diff --git a/tensorboard/tensorboard_8b7178b88boscar/events.out.tfevents.1674911187.nid005313.87724.0 b/tensorboard/tensorboard_8b7178b88boscar/events.out.tfevents.1674911187.nid005313.87724.0 new file mode 100644 index 0000000000000000000000000000000000000000..917bdfc4e705cfa4acf17ea04fd3c95cec50fc8a --- /dev/null +++ b/tensorboard/tensorboard_8b7178b88boscar/events.out.tfevents.1674911187.nid005313.87724.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd27d67e80c72145e67c7a0a8192f3acacf35d768caa0dcdd14127b08cc5ae92 +size 20562 diff --git a/tensorboard/tensorboard_8b7178b88boscar/events.out.tfevents.1674911783.nid005313.94921.0 b/tensorboard/tensorboard_8b7178b88boscar/events.out.tfevents.1674911783.nid005313.94921.0 new file mode 100644 index 0000000000000000000000000000000000000000..67e7a3f2045daecc69815b6bf1ef8ae13cd47b30 --- /dev/null +++ b/tensorboard/tensorboard_8b7178b88boscar/events.out.tfevents.1674911783.nid005313.94921.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:54c44c49667f12dd7dd3ec232f9f166de30ec4f3ec0dcc544f77a5f35bf78554 +size 35781939 diff --git a/tensorboard/tensorboard_8b7178b88boscar/events.out.tfevents.1675022797.nid005411.95066.0 b/tensorboard/tensorboard_8b7178b88boscar/events.out.tfevents.1675022797.nid005411.95066.0 new file mode 100644 index 0000000000000000000000000000000000000000..5213a4ab19fe08706c21acb94bb252e524f51ec9 --- /dev/null +++ b/tensorboard/tensorboard_8b7178b88boscar/events.out.tfevents.1675022797.nid005411.95066.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:afdffbb8781da757fefcadb9ccffc3b4982f816ca864b8b5af8d2a33842b8f6f +size 40 diff --git a/tensorboard/tensorboard_8b7178b88boscar/events.out.tfevents.1675024940.nid005411.112332.0 b/tensorboard/tensorboard_8b7178b88boscar/events.out.tfevents.1675024940.nid005411.112332.0 new file mode 100644 index 0000000000000000000000000000000000000000..84b1169851bbc734a6adcbf995e484239aa86d8f --- /dev/null +++ b/tensorboard/tensorboard_8b7178b88boscar/events.out.tfevents.1675024940.nid005411.112332.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3adfa65292ab77547fff89a5217ab22c801e58b33dbb8076ae0a1074464a292 +size 40 diff --git a/tensorboard/tensorboard_8b7178b88boscar/events.out.tfevents.1675033868.nid005411.55129.0 b/tensorboard/tensorboard_8b7178b88boscar/events.out.tfevents.1675033868.nid005411.55129.0 new file mode 100644 index 0000000000000000000000000000000000000000..abeef89980eaab90b83af82732a05aaf02c57825 --- /dev/null +++ b/tensorboard/tensorboard_8b7178b88boscar/events.out.tfevents.1675033868.nid005411.55129.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:26b100066c13cbf5949a0c48c08054f275883804fdbf59cf286f611503d9c107 +size 40 diff --git a/tensorboard/tensorboard_8b7178b88boscar/events.out.tfevents.1675036187.nid005411.75606.0 b/tensorboard/tensorboard_8b7178b88boscar/events.out.tfevents.1675036187.nid005411.75606.0 new file mode 100644 index 0000000000000000000000000000000000000000..a055019c835783c395ccedad7c67e6c9ae26c092 --- /dev/null +++ b/tensorboard/tensorboard_8b7178b88boscar/events.out.tfevents.1675036187.nid005411.75606.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:55a28bff32525a878bd1b5b964076690f4b33ad51b5f0a67776d22072c2788a1 +size 40 diff --git a/tensorboard/tensorboard_8b7178b88boscar/events.out.tfevents.1675038769.nid005462.46292.0 b/tensorboard/tensorboard_8b7178b88boscar/events.out.tfevents.1675038769.nid005462.46292.0 new file mode 100644 index 0000000000000000000000000000000000000000..c677bc8afab0f4f300e2dfe6dfff653a51ba4edb --- /dev/null +++ b/tensorboard/tensorboard_8b7178b88boscar/events.out.tfevents.1675038769.nid005462.46292.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e530257d6b2abab7bbf73d27e894055336bebc1934ecced3cbfa72faa5c7a6f +size 40