diff --git a/.gitattributes b/.gitattributes index de55ba550880b81c3070e352a1aacf35dda40d97..d4ef60d28f97d3c94e8a69bcab2b56fd2e479531 100644 --- a/.gitattributes +++ b/.gitattributes @@ -154,3 +154,27 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text 8b7178b25b/evaluation/generation/examples.8b7178b25b_gem_xsum_article_DOC_summary_1.jsonl filter=lfs diff=lfs merge=lfs -text 8b7178b25b/evaluation/generation/examples.8b7178b25b_gem_xsum_article_DOC_summary_2.jsonl filter=lfs diff=lfs merge=lfs -text */evaluatuon/generation/examples*.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b58b/evaluation/generation/examples.8b7178b58b_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b58b/evaluation/generation/examples.8b7178b58b_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b58b/evaluation/generation/examples.8b7178b58b_gem_xsum_article_DOC_summary_0.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b58b/evaluation/generation/examples.8b7178b58b_GEM-web_nlg_en_PALM_prompt_0.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b58b/evaluation/generation/examples.8b7178b58b_GEM-web_nlg_en_PALM_prompt_2.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b58b/evaluation/generation/examples.8b7178b58b_GEM-wiki_lingua_en_tldr_en_4.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b58b/evaluation/generation/examples.8b7178b58b_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b58b/evaluation/generation/examples.8b7178b58b_GEM-web_nlg_en_PALM_prompt_4.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b58b/evaluation/generation/examples.8b7178b58b_GEM-wiki_lingua_en_tldr_en_5.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b58b/evaluation/generation/examples.8b7178b58b_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b58b/evaluation/generation/examples.8b7178b58b_gem_xsum_article_DOC_summary_2.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b58b/evaluation/generation/examples.8b7178b58b_gem_xsum_article_DOC_summary_3.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b58b/evaluation/generation/examples.8b7178b58b_gem_xsum_article_DOC_summary_4.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b58b/evaluation/generation/examples.8b7178b58b_GEM-wiki_lingua_en_tldr_en_0.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b58b/evaluation/generation/examples.8b7178b58b_GEM-wiki_lingua_en_tldr_en_3.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b58b/evaluation/generation/examples.8b7178b58b_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b58b/evaluation/generation/examples.8b7178b58b_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b58b/evaluation/generation/examples.8b7178b58b_GEM-wiki_lingua_en_tldr_en_2.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b58b/evaluation/generation/examples.8b7178b58b_gem_xsum_article_DOC_summary_1.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b58b/evaluation/generation/examples.8b7178b58b_gem_xsum_article_DOC_summary_5.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b58b/evaluation/generation/examples.8b7178b58b_GEM-web_nlg_en_PALM_prompt_1.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b58b/evaluation/generation/examples.8b7178b58b_GEM-web_nlg_en_PALM_prompt_3.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b58b/evaluation/generation/examples.8b7178b58b_GEM-web_nlg_en_PALM_prompt_5.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b58b/evaluation/generation/examples.8b7178b58b_GEM-wiki_lingua_en_tldr_en_1.jsonl filter=lfs diff=lfs merge=lfs -text diff --git a/8b7178b58b/evaluation/generation/agg.8b7178b58b_GEM-web_nlg_en_PALM_prompt_0.json b/8b7178b58b/evaluation/generation/agg.8b7178b58b_GEM-web_nlg_en_PALM_prompt_0.json new file mode 100644 index 0000000000000000000000000000000000000000..464e16938e466ee4f3b6cdea89b21a141f42f5b4 --- /dev/null +++ b/8b7178b58b/evaluation/generation/agg.8b7178b58b_GEM-web_nlg_en_PALM_prompt_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.4214863735405607, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.029154609162010323}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.08388349369737222, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0028741362760589364}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.2839223617284565, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.005264418568471245}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.10879688033992795, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0021627779616647516}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.04057930751764507, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.002047816625134428}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.13506279227711254, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0032130647312794175}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.05055369077754123, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0012930809657985872}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.08041455507307416, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.002796739709192279}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.2738666536323073, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.005085678508176572}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.10393401018258999, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.002007764403266908}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.07977634567972974, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.002805961856125458}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.26749167398935675, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004882015301399527}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.10270283885145984, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002020111493088052}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b58b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 4, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b58b/evaluation/generation/agg.8b7178b58b_GEM-web_nlg_en_PALM_prompt_1.json b/8b7178b58b/evaluation/generation/agg.8b7178b58b_GEM-web_nlg_en_PALM_prompt_1.json new file mode 100644 index 0000000000000000000000000000000000000000..072f4288b5bd7434e73b4c0ff3123b81b7eb52e2 --- /dev/null +++ b/8b7178b58b/evaluation/generation/agg.8b7178b58b_GEM-web_nlg_en_PALM_prompt_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.5958530874585899, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.03649262475380295}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.13749267610186958, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.004325878829249963}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.3241716808952326, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.005125119098986173}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.16359576779434043, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.003809967310568941}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.07246358161159391, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0029673895627135506}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.16876397664351184, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.00367859006299185}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.08433674778206289, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.002591174609210514}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.12393180075905823, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0037992843733980434}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.30308740481864604, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004697897076217226}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.14881701677232517, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.003277859581563782}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.12662324522811608, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.00387820514144903}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.3067988164213401, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004754578958904846}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.15170700107447863, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0033575398797432874}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b58b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 4, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b58b/evaluation/generation/agg.8b7178b58b_GEM-web_nlg_en_PALM_prompt_2.json b/8b7178b58b/evaluation/generation/agg.8b7178b58b_GEM-web_nlg_en_PALM_prompt_2.json new file mode 100644 index 0000000000000000000000000000000000000000..b12e2c0cdd3c6cb61dbd46dbc4c705cba5f7cd16 --- /dev/null +++ b/8b7178b58b/evaluation/generation/agg.8b7178b58b_GEM-web_nlg_en_PALM_prompt_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.7632123296691333, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.038667647524407975}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.17619531326285107, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.005080542288823818}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.3742085058586801, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004920653945655996}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.2022385311781214, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.004271916206549367}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.09658792599721289, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.003611262853993622}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.20162933402440936, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0038801577073926965}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.10803467148430693, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0030612514779265803}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.15692981536908263, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.004446297762122498}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.3484780480719596, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0045553445266088635}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.18252899170611903, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0037263532749030616}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.16217269474751653, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.004631557820535045}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.35330840347834674, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004610857396095154}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.18711611785244323, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.003848891104616288}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b58b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 4, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b58b/evaluation/generation/agg.8b7178b58b_GEM-web_nlg_en_PALM_prompt_3.json b/8b7178b58b/evaluation/generation/agg.8b7178b58b_GEM-web_nlg_en_PALM_prompt_3.json new file mode 100644 index 0000000000000000000000000000000000000000..97323ea0af0c6b5ac56610d2dfdf8eebb4aa0f75 --- /dev/null +++ b/8b7178b58b/evaluation/generation/agg.8b7178b58b_GEM-web_nlg_en_PALM_prompt_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.9207133879279265, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.03255931768193071}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.18377058302813723, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.005253580997340217}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.381271206422023, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004890766475780684}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.20867536510345913, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.004354382473584997}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.10294612127680682, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0037309770662019557}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.2060814488662053, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0038997213229875847}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.11272429502619766, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0031312620749979446}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.16232375389423376, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0045761676741338285}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.35147344800261143, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004418957418369871}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.18616032806880206, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.003714239240740623}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.16801891503402527, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.004781137280246318}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.3573456612646077, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004500705918880425}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.19151809123693445, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.003873742236641197}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b58b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 4, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b58b/evaluation/generation/agg.8b7178b58b_GEM-web_nlg_en_PALM_prompt_4.json b/8b7178b58b/evaluation/generation/agg.8b7178b58b_GEM-web_nlg_en_PALM_prompt_4.json new file mode 100644 index 0000000000000000000000000000000000000000..36b72f5264e2d0f478a7c347858e4133f68eb930 --- /dev/null +++ b/8b7178b58b/evaluation/generation/agg.8b7178b58b_GEM-web_nlg_en_PALM_prompt_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.9902518578876233, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.040737732761129415}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.18789368573901274, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.005285851879717852}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.3899093270922249, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004962887842702003}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.21290146130579965, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0043700834724458276}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.10560975558011194, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.003731700714381224}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.2145796483953565, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.004035868026365014}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.11683410537192468, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0031833984768610346}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.16382625310518403, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.004486884267673038}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.3597071518828505, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004521922524975513}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.1890303353482411, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.003700023042470156}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.1707530708743364, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.004732141735621611}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.36629613801895733, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004591525609735619}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.19508857877285685, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.003865606407547543}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b58b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 4, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b58b/evaluation/generation/agg.8b7178b58b_GEM-web_nlg_en_PALM_prompt_5.json b/8b7178b58b/evaluation/generation/agg.8b7178b58b_GEM-web_nlg_en_PALM_prompt_5.json new file mode 100644 index 0000000000000000000000000000000000000000..553b94f6ee3cd4a80602612e002509b1b2d74ca6 --- /dev/null +++ b/8b7178b58b/evaluation/generation/agg.8b7178b58b_GEM-web_nlg_en_PALM_prompt_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 1.0873761263949675, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.03934330697010386}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.2117037418048869, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.005797595530762211}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.39911584774379655, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.00498148260658174}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.23018635133450477, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.004612080716063762}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.12132204155512089, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.004137193433006742}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.2209500964153402, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.004025388576844993}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.12701615271509778, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.003293666322506656}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.18406790377006843, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.004937322660278917}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.36561941279365967, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004496892763588926}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.20292345789497096, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.003854003762475144}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.19092590715178714, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.005162190150819128}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.3726247925460039, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004574209186658482}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.20912697515193987, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.00401671896906783}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b58b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 4, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b58b/evaluation/generation/agg.8b7178b58b_GEM-wiki_lingua_en_tldr_en_0.json b/8b7178b58b/evaluation/generation/agg.8b7178b58b_GEM-wiki_lingua_en_tldr_en_0.json new file mode 100644 index 0000000000000000000000000000000000000000..02ac055ab94b4efa8c20250eec43c22512e44929 --- /dev/null +++ b/8b7178b58b/evaluation/generation/agg.8b7178b58b_GEM-wiki_lingua_en_tldr_en_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.14513591635070752, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.002933831212103272}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.19891787194668262, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.003187558635297779}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.1485707360665655, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0023637963366588163}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.029907874227091444, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.000921657729333574}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.04649017309040178, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0014882369637529544}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.03346604327851081, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0009887781706946746}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.11668487543384909, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.002498896390227391}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.16129272420830681, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002571624720811961}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.11823159104307632, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0017829954318414592}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.13518764121791138, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0028124634604811717}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.18445870962398936, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0029688108031568614}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.13755330088318402, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.00219534310275043}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 2.318732566456423, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.13881817798189033}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b58b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 4, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b58b/evaluation/generation/agg.8b7178b58b_GEM-wiki_lingua_en_tldr_en_1.json b/8b7178b58b/evaluation/generation/agg.8b7178b58b_GEM-wiki_lingua_en_tldr_en_1.json new file mode 100644 index 0000000000000000000000000000000000000000..37e7ea056c736f16c933ae416b8f58b759fb7dee --- /dev/null +++ b/8b7178b58b/evaluation/generation/agg.8b7178b58b_GEM-wiki_lingua_en_tldr_en_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.248970781629388, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.003874261949118977}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.20254661208456856, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0028554953044439015}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.18955083016621427, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002379156871875284}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.0689782299271333, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.002313495667945766}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.049284004115414136, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0014678263918321242}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.04746965955266556, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0013357687513664974}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.19495136652936196, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0032222442707770895}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.1564134625395888, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002249411692052382}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.14594622749474678, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0018424648214888}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.23507901615131913, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0036892088805215145}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.19138092032456272, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002706865345022287}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.17879643931529124, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0022381896082302615}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 2.926117660825783, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.0707920058779335}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b58b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 4, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b58b/evaluation/generation/agg.8b7178b58b_GEM-wiki_lingua_en_tldr_en_2.json b/8b7178b58b/evaluation/generation/agg.8b7178b58b_GEM-wiki_lingua_en_tldr_en_2.json new file mode 100644 index 0000000000000000000000000000000000000000..4e8b01ccdc289af9ccea55dee77f593e60e19e15 --- /dev/null +++ b/8b7178b58b/evaluation/generation/agg.8b7178b58b_GEM-wiki_lingua_en_tldr_en_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.35679011396950494, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0039535541787012966}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.2525122163812022, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0028104769002719686}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.25402066807919726, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0022729602698409765}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.11566892110217673, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0025968459819964438}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.0758485270748662, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0016494845495132536}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.07776422929510499, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0015470867437394145}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.2787485396392972, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.00333060867857478}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.1946844152208185, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002269590023349728}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.19606027302517406, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0018502837344183064}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.33780149114906943, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.003819320386381285}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.23865291484527454, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0027000637562272383}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.24005412545885543, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0021905454232920693}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 4.482664241932101, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.08212180996103731}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b58b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 4, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b58b/evaluation/generation/agg.8b7178b58b_GEM-wiki_lingua_en_tldr_en_3.json b/8b7178b58b/evaluation/generation/agg.8b7178b58b_GEM-wiki_lingua_en_tldr_en_3.json new file mode 100644 index 0000000000000000000000000000000000000000..4895d8b74db1c4b7260edcda581babe883a3b07f --- /dev/null +++ b/8b7178b58b/evaluation/generation/agg.8b7178b58b_GEM-wiki_lingua_en_tldr_en_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.3061484539454385, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.004423098151670539}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.20167165147009586, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.003037208327664155}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.2113115990683054, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0027547750855983046}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.10017174467185903, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.002669280506981759}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.06128388820701079, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0016275016915406385}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.06469489115245816, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0015394791419511076}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.2427018640988824, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0037099343074804333}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.1573050958528797, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002452551923134493}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.1649989495768865, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.002208842551468564}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.29051399119634647, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.004266689720705603}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.19088557384190263, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0029163289376507914}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.19989739105994972, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0026343775714049306}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 3.0072655046058805, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.09596043858220096}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b58b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 4, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b58b/evaluation/generation/agg.8b7178b58b_GEM-wiki_lingua_en_tldr_en_4.json b/8b7178b58b/evaluation/generation/agg.8b7178b58b_GEM-wiki_lingua_en_tldr_en_4.json new file mode 100644 index 0000000000000000000000000000000000000000..c4a770cb4f711d76eac90fe69dbca21240a9adf5 --- /dev/null +++ b/8b7178b58b/evaluation/generation/agg.8b7178b58b_GEM-wiki_lingua_en_tldr_en_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.09734210523837013, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.003585657330962349}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.06338401184872311, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002461970340537986}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.06646559577850898, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002389468792903583}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.0321171525149136, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0017883302892353346}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.019779405420936473, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0011693482689711905}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.020767091534965167, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.001088077081953597}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.07721998831670598, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.002911924342353414}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.05016221089779053, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.001994888739662481}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.05241812699049824, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0019162468765830335}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.09174287392107108, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0034181860926286}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.05945776168044872, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0023246003955623533}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.062355467850168954, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0022529742622293867}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 0.02961687910857089, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.00667797537003518}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b58b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 4, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b58b/evaluation/generation/agg.8b7178b58b_GEM-wiki_lingua_en_tldr_en_5.json b/8b7178b58b/evaluation/generation/agg.8b7178b58b_GEM-wiki_lingua_en_tldr_en_5.json new file mode 100644 index 0000000000000000000000000000000000000000..49f10d711b9ecf7b628a2a606cf0cdba2b6e9310 --- /dev/null +++ b/8b7178b58b/evaluation/generation/agg.8b7178b58b_GEM-wiki_lingua_en_tldr_en_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.01662223836437527, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0017200192815433816}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.010369987242786843, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0011350821871749513}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.010515163702672926, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.001060191799945764}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.0056669762870846345, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0008937346232787428}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.0035137406087487875, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0005888971524329703}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.0034609320209794962, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.000506080127090741}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.013605527079975888, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0014624549576253666}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.008580131540181942, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0009742333834018987}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.00858027237742148, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0008896522724178397}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.015819080798652796, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.001649211944475785}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.009938412449545603, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0011052383189021134}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.010008632917285501, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0010183013884774283}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 5.0425595242130537e-17, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 5.828914972997529e-15}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b58b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 4, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b58b/evaluation/generation/agg.8b7178b58b_e2e_nlg_cleaned_generate_text_restaurant_0.json b/8b7178b58b/evaluation/generation/agg.8b7178b58b_e2e_nlg_cleaned_generate_text_restaurant_0.json new file mode 100644 index 0000000000000000000000000000000000000000..1504cf4b1362cf5455a14fa5bd8f482b431001e5 --- /dev/null +++ b/8b7178b58b/evaluation/generation/agg.8b7178b58b_e2e_nlg_cleaned_generate_text_restaurant_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 3.727703428672484, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.16225275145292814}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.15580458811715164, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.004522055277902883}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.16212105310140335, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0038770863196531777}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.11677483396146617, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0026043522717618377}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.08759078800738393, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.004060781916683637}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.05918434764233474, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.001745078033222418}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.04207195309354536, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0011458322627199238}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.13984894212789747, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0044166136430229454}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.1340573709320961, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0031951681845401422}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.0970712318345091, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.002118544001686245}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.14388054529296093, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.004453879377805569}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.14043655820750423, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.003394973082402341}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.10190557193119215, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0022803567703003585}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b58b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 4, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b58b/evaluation/generation/agg.8b7178b58b_e2e_nlg_cleaned_generate_text_restaurant_1.json b/8b7178b58b/evaluation/generation/agg.8b7178b58b_e2e_nlg_cleaned_generate_text_restaurant_1.json new file mode 100644 index 0000000000000000000000000000000000000000..5774c7f78e1d0282a71f82b3ccf52eb98ece792b --- /dev/null +++ b/8b7178b58b/evaluation/generation/agg.8b7178b58b_e2e_nlg_cleaned_generate_text_restaurant_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 12.253787105095654, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.1531956101772429}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.5916925132644157, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.00322106862270845}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.4463736554053124, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0030343957764200962}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.48227052690365063, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002317881335104088}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.2838064949819702, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0027789665070579485}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.2105351617568858, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0022171957363924296}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.22765626131798156, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0020703831562182183}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.43217159380951586, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0029973445963260422}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.32230580960354577, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0024575923055788883}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.34946822459925764, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0020719433030147168}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.48366766620362545, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0032029340181387936}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.36354140064435775, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0027910193529178087}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.3932633862316688, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002340814619008484}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b58b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 4, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b58b/evaluation/generation/agg.8b7178b58b_e2e_nlg_cleaned_generate_text_restaurant_2.json b/8b7178b58b/evaluation/generation/agg.8b7178b58b_e2e_nlg_cleaned_generate_text_restaurant_2.json new file mode 100644 index 0000000000000000000000000000000000000000..c8ad3f50f6c6aff4c99b2e683819ee12a165eea1 --- /dev/null +++ b/8b7178b58b/evaluation/generation/agg.8b7178b58b_e2e_nlg_cleaned_generate_text_restaurant_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 14.934222887897532, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.21278791413856055}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.6137196300402722, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0031475076717186906}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.48231229181347424, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002994935365094384}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.5160444555536067, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.00228951307038736}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.3128748478554642, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0028571435877434844}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.24224424588278937, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002338319832959116}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.2594509643808628, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0021848217582054836}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.4496161361042401, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.002965960715542685}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.35106979956416473, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0025186871703425898}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.37626113256931526, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0021363134322449147}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.5075541777391559, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.003180746032746745}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.3982152959674102, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002838831357019365}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.42631762287613684, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.00239431216095114}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b58b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 4, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b58b/evaluation/generation/agg.8b7178b58b_e2e_nlg_cleaned_generate_text_restaurant_3.json b/8b7178b58b/evaluation/generation/agg.8b7178b58b_e2e_nlg_cleaned_generate_text_restaurant_3.json new file mode 100644 index 0000000000000000000000000000000000000000..5f9d48d1878d1d5ac8c20c909c5164b41e070806 --- /dev/null +++ b/8b7178b58b/evaluation/generation/agg.8b7178b58b_e2e_nlg_cleaned_generate_text_restaurant_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 15.550166229098965, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.21100324131614723}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.6164424274284126, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0031180799828950793}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.49077882213900875, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002902655623188235}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.5240247422123916, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0022364704364336795}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.3165046826237152, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.002782884317807398}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.24838679979596562, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0023021548981493603}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.2655834480484239, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0021599553939183514}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.45453733777109134, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0029846320407150165}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.35943496219625287, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002503259775759038}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.38460762326164105, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0021692227869033478}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.5148376263253541, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0031730624992959006}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.4092664706750279, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002806743229599867}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.4372484038981659, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002394606287079693}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b58b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 4, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b58b/evaluation/generation/agg.8b7178b58b_e2e_nlg_cleaned_generate_text_restaurant_4.json b/8b7178b58b/evaluation/generation/agg.8b7178b58b_e2e_nlg_cleaned_generate_text_restaurant_4.json new file mode 100644 index 0000000000000000000000000000000000000000..03ac5c92eab91184b9f7e63a6c43af9b990d35b0 --- /dev/null +++ b/8b7178b58b/evaluation/generation/agg.8b7178b58b_e2e_nlg_cleaned_generate_text_restaurant_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 15.882734366339575, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.20014792318307217}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.617829970748385, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0031627975477214964}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.4934813921824228, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0028974554963002866}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.5268811401300224, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002296537855184882}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.31982595333569097, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.002834806640598152}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.2524396113719004, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002374239958755143}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.2697484320297564, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0022376325121211964}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.4547884196194121, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0029857683967765883}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.36242825370807497, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.00256326606590863}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.38708461902411606, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.002242571110085911}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.5162937268213095, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.003187124832415968}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.4128904038699314, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0028402630566630306}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.4406025001412695, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0024516808057243426}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b58b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 4, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b58b/evaluation/generation/agg.8b7178b58b_e2e_nlg_cleaned_generate_text_restaurant_5.json b/8b7178b58b/evaluation/generation/agg.8b7178b58b_e2e_nlg_cleaned_generate_text_restaurant_5.json new file mode 100644 index 0000000000000000000000000000000000000000..fb9ea901aa5e97e89b623956115c4abf6b1ad09b --- /dev/null +++ b/8b7178b58b/evaluation/generation/agg.8b7178b58b_e2e_nlg_cleaned_generate_text_restaurant_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 15.843755546529314, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.23380050838762192}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.6189660173531598, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.003202216597059111}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.49387787166933184, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.00292152626004202}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.5268007980171965, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0022830659821340285}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.32113506253536717, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.002823936183018856}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.25289072399317875, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0023526916821315917}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.26998871183013234, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0021968682565042135}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.45492486270003574, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.002993407598047982}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.3622504836542661, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002569318863258077}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.38651546157123484, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.002221892359998622}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.5179172358492237, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0032140290174150392}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.4135121055179984, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0028519351140784115}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.44101339790167177, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0024405926593214712}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b58b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 4, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b58b/evaluation/generation/agg.8b7178b58b_gem_xsum_article_DOC_summary_0.json b/8b7178b58b/evaluation/generation/agg.8b7178b58b_gem_xsum_article_DOC_summary_0.json new file mode 100644 index 0000000000000000000000000000000000000000..fcc2d2bd5efc27028d125acd459ce9ccfd399cf8 --- /dev/null +++ b/8b7178b58b/evaluation/generation/agg.8b7178b58b_gem_xsum_article_DOC_summary_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.16834475552405148, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.002143734509300351}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.3812302941527284, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004466228338306761}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.22900899484830875, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002592170416843644}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.04090800254887081, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.001331305757616898}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.09717669760813316, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0031305903631064793}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.056521580391250686, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0017743435854162372}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.12317643828521285, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0017773839864967875}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.2797265709939456, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0036566609405842706}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.16720327598962526, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0020460047183396978}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.1339383429556578, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0019089490816378235}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.3045528042834054, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004033519848039268}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.18208585408505043, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.00227028405987386}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 2.4021403698389303, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.067244017856741}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b58b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 4, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b58b/evaluation/generation/agg.8b7178b58b_gem_xsum_article_DOC_summary_1.json b/8b7178b58b/evaluation/generation/agg.8b7178b58b_gem_xsum_article_DOC_summary_1.json new file mode 100644 index 0000000000000000000000000000000000000000..77524186fcae6b2de62c90228c2d2d4b7d420d89 --- /dev/null +++ b/8b7178b58b/evaluation/generation/agg.8b7178b58b_gem_xsum_article_DOC_summary_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.2269075171314588, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.004333302214651766}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.24532990314212508, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.003988402379243326}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.22010181845678548, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0035289902424468713}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.052629985612383176, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0026272197223151062}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.05514694411681367, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002420925395374345}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.04964766400970655, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.002214536505649702}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.1721080105359506, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.003568699794613313}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.18654158462763012, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0032259213006477503}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.16668249804551818, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.002858700548419538}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.17318677280555747, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0035702087618089537}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.18887685302453283, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.003346146632601525}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.168054574737479, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0028788648929427077}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 2.587973656923586, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.18271829592693106}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b58b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 4, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b58b/evaluation/generation/agg.8b7178b58b_gem_xsum_article_DOC_summary_2.json b/8b7178b58b/evaluation/generation/agg.8b7178b58b_gem_xsum_article_DOC_summary_2.json new file mode 100644 index 0000000000000000000000000000000000000000..6c1ef836dc520f0b5a2173828c6a89cd61cf7ca7 --- /dev/null +++ b/8b7178b58b/evaluation/generation/agg.8b7178b58b_gem_xsum_article_DOC_summary_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.23962839287439405, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.004379685148326459}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.24084621475655701, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.003791189958412602}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.22681874696670282, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0035634918232377074}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.05825281986003038, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0026810505602905777}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.056775559678677465, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002426834325647628}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.05421648195620343, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0023479794051376422}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.1845331825452337, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.003580958301916115}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.18702023658313446, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.003174519635609054}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.17492387767242143, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0029179836282209}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.1851109498506353, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0035857038136326946}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.1874180466959014, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0031802199539878143}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.17541718007715307, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0029228112018755566}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 2.894349555094649, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.20938561045016857}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b58b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 4, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b58b/evaluation/generation/agg.8b7178b58b_gem_xsum_article_DOC_summary_3.json b/8b7178b58b/evaluation/generation/agg.8b7178b58b_gem_xsum_article_DOC_summary_3.json new file mode 100644 index 0000000000000000000000000000000000000000..a4bcccfb73f550571b354d2e1c709600c13d2d76 --- /dev/null +++ b/8b7178b58b/evaluation/generation/agg.8b7178b58b_gem_xsum_article_DOC_summary_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.2493216186518576, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0049084458961309585}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.23437481439478378, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.00414167551937926}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.22875361771029976, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.004084338493816929}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.06426035314217526, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0029430708789924724}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.05825170712730457, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0025593535615914685}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.058170472646030105, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.002575465227066567}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.19044444305113, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.004057392892502295}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.1796956624879631, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0034464435487860908}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.17477557833568425, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.003389234359734604}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.19176785292110343, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.004051683679981941}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.1817729140455351, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0034769204180304563}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.17624162420032213, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0033874175464656286}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 3.3807185036949794, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.21747997288721058}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b58b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 4, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b58b/evaluation/generation/agg.8b7178b58b_gem_xsum_article_DOC_summary_4.json b/8b7178b58b/evaluation/generation/agg.8b7178b58b_gem_xsum_article_DOC_summary_4.json new file mode 100644 index 0000000000000000000000000000000000000000..29397d0803d969c105edd7c06eea75a1491e3a4c --- /dev/null +++ b/8b7178b58b/evaluation/generation/agg.8b7178b58b_gem_xsum_article_DOC_summary_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.06368749975876878, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.004163291649927898}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.05633355721143847, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.003674327931986382}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.055495095278546853, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0035332699011158906}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.01625809935844295, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.001744008450570692}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.014127871826558468, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0014279592951878697}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.014126745787126624, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0014244420667161892}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.048922678698080466, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.003321571568066582}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.04260833742058202, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0028433365851945613}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.042006581084650725, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.002736359920016333}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.049121011091270275, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0033301554897141204}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.042965789423027506, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0028912525537101723}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.04223553974124363, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0027526558135678226}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 0.11188091321184003, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.02931669237987178}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b58b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 4, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b58b/evaluation/generation/agg.8b7178b58b_gem_xsum_article_DOC_summary_5.json b/8b7178b58b/evaluation/generation/agg.8b7178b58b_gem_xsum_article_DOC_summary_5.json new file mode 100644 index 0000000000000000000000000000000000000000..6d015fd3c07147e4bd2c28bffb5b62ce0bf85fce --- /dev/null +++ b/8b7178b58b/evaluation/generation/agg.8b7178b58b_gem_xsum_article_DOC_summary_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.002666427538603693, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.001013100557726815}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.0025861091150659685, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0008630243879275325}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.002533146063446972, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0008926774274323296}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.0007974546793721661, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0004389545775956508}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.0006295661715078737, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.00030074990914758437}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.0006840490507628032, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.00035126113759812106}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.002022260888604123, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0008452973095491474}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.0018561449826780235, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0006574742336350735}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.0018694866909844472, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0007140136174659965}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.00205235327222183, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0008479115148274438}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.0019247556173263936, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0006749866649238696}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.0019113224438188196, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.000720026623055153}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 2.2560041633308834e-45, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 1.8421463064085026e-30}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b58b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 4, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b58b/evaluation/generation/examples.8b7178b58b_GEM-web_nlg_en_PALM_prompt_0.jsonl b/8b7178b58b/evaluation/generation/examples.8b7178b58b_GEM-web_nlg_en_PALM_prompt_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..02f193528cebac6125d7eddfe7fd1bf1215c2f04 --- /dev/null +++ b/8b7178b58b/evaluation/generation/examples.8b7178b58b_GEM-web_nlg_en_PALM_prompt_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:999314d630dfd9d528eaa6230f070bb1f3db2faf5eea5e2e962a536be45282a9 +size 3826859 diff --git a/8b7178b58b/evaluation/generation/examples.8b7178b58b_GEM-web_nlg_en_PALM_prompt_1.jsonl b/8b7178b58b/evaluation/generation/examples.8b7178b58b_GEM-web_nlg_en_PALM_prompt_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..12602e07fec6ff24ec5c8477fe78c1618825cf6f --- /dev/null +++ b/8b7178b58b/evaluation/generation/examples.8b7178b58b_GEM-web_nlg_en_PALM_prompt_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:685e819c0eb246cad2b68f001632bee56372b55a7ae05f7b3c206cacd6e69d1b +size 4675327 diff --git a/8b7178b58b/evaluation/generation/examples.8b7178b58b_GEM-web_nlg_en_PALM_prompt_2.jsonl b/8b7178b58b/evaluation/generation/examples.8b7178b58b_GEM-web_nlg_en_PALM_prompt_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..b9f5864400e1639c9dbc7f7719f3e6d4bd211bbd --- /dev/null +++ b/8b7178b58b/evaluation/generation/examples.8b7178b58b_GEM-web_nlg_en_PALM_prompt_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:05fba4233df83d76565f5204a6e91220b7897a475fb332bcfe429776427d2a7d +size 5544035 diff --git a/8b7178b58b/evaluation/generation/examples.8b7178b58b_GEM-web_nlg_en_PALM_prompt_3.jsonl b/8b7178b58b/evaluation/generation/examples.8b7178b58b_GEM-web_nlg_en_PALM_prompt_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..68363e7e66de3862c38f34ba0669bb2375d3861f --- /dev/null +++ b/8b7178b58b/evaluation/generation/examples.8b7178b58b_GEM-web_nlg_en_PALM_prompt_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b91afc186928b41b01d7580f6487c376c8acb60f71bfad13d4f81b92c3bc9ee6 +size 6450894 diff --git a/8b7178b58b/evaluation/generation/examples.8b7178b58b_GEM-web_nlg_en_PALM_prompt_4.jsonl b/8b7178b58b/evaluation/generation/examples.8b7178b58b_GEM-web_nlg_en_PALM_prompt_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..d4c1d86737dcee5b28bb6de7c016067d4f0d1220 --- /dev/null +++ b/8b7178b58b/evaluation/generation/examples.8b7178b58b_GEM-web_nlg_en_PALM_prompt_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c946648dd00705a87ead7c8922ccfbfc3bbe8d28246880b2bbe610b7f6e22242 +size 7355578 diff --git a/8b7178b58b/evaluation/generation/examples.8b7178b58b_GEM-web_nlg_en_PALM_prompt_5.jsonl b/8b7178b58b/evaluation/generation/examples.8b7178b58b_GEM-web_nlg_en_PALM_prompt_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e9dde2ea4aada6e763df7392c6a846e65cbc66bf --- /dev/null +++ b/8b7178b58b/evaluation/generation/examples.8b7178b58b_GEM-web_nlg_en_PALM_prompt_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:060a7dee2d30e7d20d468323adfbaa24e21010912a63ac0a83c71e42611d0d83 +size 8203278 diff --git a/8b7178b58b/evaluation/generation/examples.8b7178b58b_GEM-wiki_lingua_en_tldr_en_0.jsonl b/8b7178b58b/evaluation/generation/examples.8b7178b58b_GEM-wiki_lingua_en_tldr_en_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..cfc312a4c2ff1b2510351e7a3f527086ba9b9917 --- /dev/null +++ b/8b7178b58b/evaluation/generation/examples.8b7178b58b_GEM-wiki_lingua_en_tldr_en_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b6d01dc9f2c851a0a9ba0041c33a7769f1d407bc6610552b147bf28b3fcbf1eb +size 7474008 diff --git a/8b7178b58b/evaluation/generation/examples.8b7178b58b_GEM-wiki_lingua_en_tldr_en_1.jsonl b/8b7178b58b/evaluation/generation/examples.8b7178b58b_GEM-wiki_lingua_en_tldr_en_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..806456a5ca76140756f9aa5544b6293b6d5c880e --- /dev/null +++ b/8b7178b58b/evaluation/generation/examples.8b7178b58b_GEM-wiki_lingua_en_tldr_en_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:073d9ea4667f0197b6c0ac0508ebd5d9fd085e9c0ca9fc2d61f4e3ef2ae9caad +size 12974793 diff --git a/8b7178b58b/evaluation/generation/examples.8b7178b58b_GEM-wiki_lingua_en_tldr_en_2.jsonl b/8b7178b58b/evaluation/generation/examples.8b7178b58b_GEM-wiki_lingua_en_tldr_en_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..27e00a6abc6b9b1d93c9bfba6227bad79fd7363b --- /dev/null +++ b/8b7178b58b/evaluation/generation/examples.8b7178b58b_GEM-wiki_lingua_en_tldr_en_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6c5d1d9a19c179c3ac04bb0aaac662c0680c22b70a21dbd4dade5f5b2205fe9 +size 18511889 diff --git a/8b7178b58b/evaluation/generation/examples.8b7178b58b_GEM-wiki_lingua_en_tldr_en_3.jsonl b/8b7178b58b/evaluation/generation/examples.8b7178b58b_GEM-wiki_lingua_en_tldr_en_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..a518d5ddb1b6733f8927142ae4b7aaebae7033d4 --- /dev/null +++ b/8b7178b58b/evaluation/generation/examples.8b7178b58b_GEM-wiki_lingua_en_tldr_en_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:edd1393814c2a1311185bcb30b2bf7ac4aeb32eaf4ad91300efb80ce87b1f086 +size 23979958 diff --git a/8b7178b58b/evaluation/generation/examples.8b7178b58b_GEM-wiki_lingua_en_tldr_en_4.jsonl b/8b7178b58b/evaluation/generation/examples.8b7178b58b_GEM-wiki_lingua_en_tldr_en_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..73233c64dee23279237279557a6f277d908bd76a --- /dev/null +++ b/8b7178b58b/evaluation/generation/examples.8b7178b58b_GEM-wiki_lingua_en_tldr_en_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f120116c84c04d47b762b3dee5be12da1b87cf8ef18fbbde9dee1231935734b5 +size 29348945 diff --git a/8b7178b58b/evaluation/generation/examples.8b7178b58b_GEM-wiki_lingua_en_tldr_en_5.jsonl b/8b7178b58b/evaluation/generation/examples.8b7178b58b_GEM-wiki_lingua_en_tldr_en_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..5b836fc0e14c24d40f2cd1265b5986fb1466edc8 --- /dev/null +++ b/8b7178b58b/evaluation/generation/examples.8b7178b58b_GEM-wiki_lingua_en_tldr_en_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7211f33c7d358f67c5f5471cb174ed187e36ad79ee97136d17f78748c78766b +size 34781314 diff --git a/8b7178b58b/evaluation/generation/examples.8b7178b58b_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl b/8b7178b58b/evaluation/generation/examples.8b7178b58b_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e2374daff4244c84158472ae056dad76e5f4279d --- /dev/null +++ b/8b7178b58b/evaluation/generation/examples.8b7178b58b_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b7f8396f30f4b424731f872fb7dd5598220e06b58bcaf214ab85950a6986b74 +size 3913147 diff --git a/8b7178b58b/evaluation/generation/examples.8b7178b58b_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl b/8b7178b58b/evaluation/generation/examples.8b7178b58b_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..957213962fff4acfe110b6b5b71e310d922482d3 --- /dev/null +++ b/8b7178b58b/evaluation/generation/examples.8b7178b58b_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e54542fa9e8b72e1a2245fa6e07b548a61234b0544ba6b593d54e16a0736ef8b +size 4995721 diff --git a/8b7178b58b/evaluation/generation/examples.8b7178b58b_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl b/8b7178b58b/evaluation/generation/examples.8b7178b58b_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..2d4464946c86b9f811d8f1b108d65bdb2a993597 --- /dev/null +++ b/8b7178b58b/evaluation/generation/examples.8b7178b58b_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:167e34641de8e0f3a38a77887598ad043f6ebfe197eb73d2e492aea39b07a8b8 +size 6088962 diff --git a/8b7178b58b/evaluation/generation/examples.8b7178b58b_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl b/8b7178b58b/evaluation/generation/examples.8b7178b58b_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e62ddafd2762b86a1faa8a50865cb32747bc517f --- /dev/null +++ b/8b7178b58b/evaluation/generation/examples.8b7178b58b_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ceb66a51106fedd8264816b8abfa2f84e235054f99b903b86924eb4b37c627e0 +size 7173918 diff --git a/8b7178b58b/evaluation/generation/examples.8b7178b58b_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl b/8b7178b58b/evaluation/generation/examples.8b7178b58b_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..c9057ddaf5d0c8977f33556376b9a559b856131a --- /dev/null +++ b/8b7178b58b/evaluation/generation/examples.8b7178b58b_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0124e953ce167c49cc75b7e5e99b0dfdfe7b4d7546a2afaed6cb8018b31b2ed0 +size 8254009 diff --git a/8b7178b58b/evaluation/generation/examples.8b7178b58b_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl b/8b7178b58b/evaluation/generation/examples.8b7178b58b_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..1577506c63fa798371514540451d423ee92e3bff --- /dev/null +++ b/8b7178b58b/evaluation/generation/examples.8b7178b58b_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6dceb72df16567da24b8811e1fd6063e46501a02782563c2d9c97404d3014877 +size 9340395 diff --git a/8b7178b58b/evaluation/generation/examples.8b7178b58b_gem_xsum_article_DOC_summary_0.jsonl b/8b7178b58b/evaluation/generation/examples.8b7178b58b_gem_xsum_article_DOC_summary_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..7585b8d868c2f07a2f38743392fe997d09a9106b --- /dev/null +++ b/8b7178b58b/evaluation/generation/examples.8b7178b58b_gem_xsum_article_DOC_summary_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3cd5e50bf6dd8a1f8ab6336ae348fb85af79fafb3a63aa295c28a3d1ab9ec6f0 +size 2819929 diff --git a/8b7178b58b/evaluation/generation/examples.8b7178b58b_gem_xsum_article_DOC_summary_1.jsonl b/8b7178b58b/evaluation/generation/examples.8b7178b58b_gem_xsum_article_DOC_summary_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e7abf69651e820a2d1a539de9b67d35ebf0a4966 --- /dev/null +++ b/8b7178b58b/evaluation/generation/examples.8b7178b58b_gem_xsum_article_DOC_summary_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2254c0b7c6d11284e31faf794426e4e69e1e227e24682d1c6adace48e70a6ea9 +size 4932939 diff --git a/8b7178b58b/evaluation/generation/examples.8b7178b58b_gem_xsum_article_DOC_summary_2.jsonl b/8b7178b58b/evaluation/generation/examples.8b7178b58b_gem_xsum_article_DOC_summary_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..6767e2e5acf7e1db9c421bbca3e4b16a599da3ca --- /dev/null +++ b/8b7178b58b/evaluation/generation/examples.8b7178b58b_gem_xsum_article_DOC_summary_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4060246592b6d614bd4c7996e5c2dbe95e0f26cef29c0c8bbcb242e8e1a1f097 +size 7191441 diff --git a/8b7178b58b/evaluation/generation/examples.8b7178b58b_gem_xsum_article_DOC_summary_3.jsonl b/8b7178b58b/evaluation/generation/examples.8b7178b58b_gem_xsum_article_DOC_summary_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..d15d13280798a1047f7b4484c8e1cb50eb24b9a4 --- /dev/null +++ b/8b7178b58b/evaluation/generation/examples.8b7178b58b_gem_xsum_article_DOC_summary_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:854251bf91963cde44115e46953bbd4e9a698807a8561fde1a3785376573a57f +size 9465177 diff --git a/8b7178b58b/evaluation/generation/examples.8b7178b58b_gem_xsum_article_DOC_summary_4.jsonl b/8b7178b58b/evaluation/generation/examples.8b7178b58b_gem_xsum_article_DOC_summary_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..2706c1bcada1b699bf4991a33a60c51e0be7f245 --- /dev/null +++ b/8b7178b58b/evaluation/generation/examples.8b7178b58b_gem_xsum_article_DOC_summary_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a8a42c49f8d54de427f4765071db6b54a45cfbd67330506153201ce56fa27f2 +size 11626705 diff --git a/8b7178b58b/evaluation/generation/examples.8b7178b58b_gem_xsum_article_DOC_summary_5.jsonl b/8b7178b58b/evaluation/generation/examples.8b7178b58b_gem_xsum_article_DOC_summary_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..25572edf78cdffedafb51c41851542b4b9651620 --- /dev/null +++ b/8b7178b58b/evaluation/generation/examples.8b7178b58b_gem_xsum_article_DOC_summary_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:61a6f2c75b042d4bc922fab9249987870fdb860d2d115ae74cde1b1bd038913c +size 13897275 diff --git a/8b7178b58b/evaluation/generation/slim.8b7178b58b_GEM-web_nlg_en_PALM_prompt_0.json b/8b7178b58b/evaluation/generation/slim.8b7178b58b_GEM-web_nlg_en_PALM_prompt_0.json new file mode 100644 index 0000000000000000000000000000000000000000..d3d4c9e8edebac439fde7b95ae237f11430f0539 --- /dev/null +++ b/8b7178b58b/evaluation/generation/slim.8b7178b58b_GEM-web_nlg_en_PALM_prompt_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.4214863735405607, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.029154609162010323 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.08388349369737222, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0028741362760589364 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.2839223617284565, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.005264418568471245 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.10879688033992795, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0021627779616647516 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.04057930751764507, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.002047816625134428 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.13506279227711254, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0032130647312794175 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.05055369077754123, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0012930809657985872 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.08041455507307416, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.002796739709192279 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.2738666536323073, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.005085678508176572 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.10393401018258999, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.002007764403266908 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.07977634567972974, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.002805961856125458 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.26749167398935675, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004882015301399527 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.10270283885145984, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.002020111493088052 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b58b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 4, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b58b/evaluation/generation/slim.8b7178b58b_GEM-web_nlg_en_PALM_prompt_1.json b/8b7178b58b/evaluation/generation/slim.8b7178b58b_GEM-web_nlg_en_PALM_prompt_1.json new file mode 100644 index 0000000000000000000000000000000000000000..a92747fe1835193c41e73763dcf641feb1e722f3 --- /dev/null +++ b/8b7178b58b/evaluation/generation/slim.8b7178b58b_GEM-web_nlg_en_PALM_prompt_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.5958530874585899, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.03649262475380295 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.13749267610186958, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.004325878829249963 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.3241716808952326, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.005125119098986173 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.16359576779434043, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.003809967310568941 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.07246358161159391, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0029673895627135506 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.16876397664351184, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.00367859006299185 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.08433674778206289, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.002591174609210514 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.12393180075905823, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0037992843733980434 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.30308740481864604, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004697897076217226 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.14881701677232517, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.003277859581563782 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.12662324522811608, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.00387820514144903 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.3067988164213401, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004754578958904846 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.15170700107447863, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0033575398797432874 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b58b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 4, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b58b/evaluation/generation/slim.8b7178b58b_GEM-web_nlg_en_PALM_prompt_2.json b/8b7178b58b/evaluation/generation/slim.8b7178b58b_GEM-web_nlg_en_PALM_prompt_2.json new file mode 100644 index 0000000000000000000000000000000000000000..d1c3d7e77b9d32d7b7c6264acf0648533dc2dfcb --- /dev/null +++ b/8b7178b58b/evaluation/generation/slim.8b7178b58b_GEM-web_nlg_en_PALM_prompt_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.7632123296691333, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.038667647524407975 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.17619531326285107, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.005080542288823818 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.3742085058586801, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.004920653945655996 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.2022385311781214, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.004271916206549367 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.09658792599721289, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.003611262853993622 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.20162933402440936, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0038801577073926965 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.10803467148430693, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0030612514779265803 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.15692981536908263, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.004446297762122498 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.3484780480719596, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0045553445266088635 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.18252899170611903, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0037263532749030616 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.16217269474751653, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.004631557820535045 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.35330840347834674, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004610857396095154 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.18711611785244323, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.003848891104616288 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b58b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 4, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b58b/evaluation/generation/slim.8b7178b58b_GEM-web_nlg_en_PALM_prompt_3.json b/8b7178b58b/evaluation/generation/slim.8b7178b58b_GEM-web_nlg_en_PALM_prompt_3.json new file mode 100644 index 0000000000000000000000000000000000000000..ea884486e07e2523f6420964a13c98e0c5e99c9c --- /dev/null +++ b/8b7178b58b/evaluation/generation/slim.8b7178b58b_GEM-web_nlg_en_PALM_prompt_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.9207133879279265, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.03255931768193071 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.18377058302813723, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.005253580997340217 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.381271206422023, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.004890766475780684 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.20867536510345913, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.004354382473584997 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.10294612127680682, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0037309770662019557 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.2060814488662053, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0038997213229875847 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.11272429502619766, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0031312620749979446 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.16232375389423376, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0045761676741338285 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.35147344800261143, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004418957418369871 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.18616032806880206, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.003714239240740623 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.16801891503402527, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.004781137280246318 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.3573456612646077, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004500705918880425 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.19151809123693445, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.003873742236641197 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b58b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 4, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b58b/evaluation/generation/slim.8b7178b58b_GEM-web_nlg_en_PALM_prompt_4.json b/8b7178b58b/evaluation/generation/slim.8b7178b58b_GEM-web_nlg_en_PALM_prompt_4.json new file mode 100644 index 0000000000000000000000000000000000000000..8816849dc14ecf3f095fa8d47616d2f2c1a01816 --- /dev/null +++ b/8b7178b58b/evaluation/generation/slim.8b7178b58b_GEM-web_nlg_en_PALM_prompt_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.9902518578876233, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.040737732761129415 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.18789368573901274, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.005285851879717852 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.3899093270922249, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.004962887842702003 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.21290146130579965, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0043700834724458276 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.10560975558011194, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.003731700714381224 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.2145796483953565, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.004035868026365014 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.11683410537192468, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0031833984768610346 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.16382625310518403, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.004486884267673038 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.3597071518828505, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004521922524975513 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.1890303353482411, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.003700023042470156 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.1707530708743364, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.004732141735621611 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.36629613801895733, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004591525609735619 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.19508857877285685, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.003865606407547543 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b58b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 4, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b58b/evaluation/generation/slim.8b7178b58b_GEM-web_nlg_en_PALM_prompt_5.json b/8b7178b58b/evaluation/generation/slim.8b7178b58b_GEM-web_nlg_en_PALM_prompt_5.json new file mode 100644 index 0000000000000000000000000000000000000000..b5423137df378b655875c6ed987827272c3be92e --- /dev/null +++ b/8b7178b58b/evaluation/generation/slim.8b7178b58b_GEM-web_nlg_en_PALM_prompt_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 1.0873761263949675, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.03934330697010386 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.2117037418048869, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.005797595530762211 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.39911584774379655, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.00498148260658174 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.23018635133450477, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.004612080716063762 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.12132204155512089, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.004137193433006742 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.2209500964153402, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.004025388576844993 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.12701615271509778, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.003293666322506656 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.18406790377006843, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.004937322660278917 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.36561941279365967, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004496892763588926 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.20292345789497096, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.003854003762475144 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.19092590715178714, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.005162190150819128 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.3726247925460039, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004574209186658482 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.20912697515193987, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.00401671896906783 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b58b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 4, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b58b/evaluation/generation/slim.8b7178b58b_GEM-wiki_lingua_en_tldr_en_0.json b/8b7178b58b/evaluation/generation/slim.8b7178b58b_GEM-wiki_lingua_en_tldr_en_0.json new file mode 100644 index 0000000000000000000000000000000000000000..dcd64c00dba2500aa400b6cda334fd61850b8b71 --- /dev/null +++ b/8b7178b58b/evaluation/generation/slim.8b7178b58b_GEM-wiki_lingua_en_tldr_en_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.14513591635070752, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.002933831212103272 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.19891787194668262, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.003187558635297779 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.1485707360665655, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0023637963366588163 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.029907874227091444, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.000921657729333574 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.04649017309040178, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0014882369637529544 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.03346604327851081, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0009887781706946746 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.11668487543384909, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.002498896390227391 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.16129272420830681, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.002571624720811961 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.11823159104307632, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0017829954318414592 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.13518764121791138, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0028124634604811717 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.18445870962398936, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0029688108031568614 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.13755330088318402, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.00219534310275043 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 2.318732566456423, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.13881817798189033 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b58b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 4, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b58b/evaluation/generation/slim.8b7178b58b_GEM-wiki_lingua_en_tldr_en_1.json b/8b7178b58b/evaluation/generation/slim.8b7178b58b_GEM-wiki_lingua_en_tldr_en_1.json new file mode 100644 index 0000000000000000000000000000000000000000..79161c2dfc8a160a85e47496056dc61bc38760e3 --- /dev/null +++ b/8b7178b58b/evaluation/generation/slim.8b7178b58b_GEM-wiki_lingua_en_tldr_en_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.248970781629388, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.003874261949118977 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.20254661208456856, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0028554953044439015 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.18955083016621427, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.002379156871875284 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.0689782299271333, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.002313495667945766 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.049284004115414136, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0014678263918321242 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.04746965955266556, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0013357687513664974 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.19495136652936196, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0032222442707770895 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.1564134625395888, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.002249411692052382 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.14594622749474678, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0018424648214888 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.23507901615131913, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0036892088805215145 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.19138092032456272, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.002706865345022287 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.17879643931529124, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0022381896082302615 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 2.926117660825783, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.0707920058779335 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b58b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 4, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b58b/evaluation/generation/slim.8b7178b58b_GEM-wiki_lingua_en_tldr_en_2.json b/8b7178b58b/evaluation/generation/slim.8b7178b58b_GEM-wiki_lingua_en_tldr_en_2.json new file mode 100644 index 0000000000000000000000000000000000000000..81848a815150e4619c341aba2d2e87686efc0015 --- /dev/null +++ b/8b7178b58b/evaluation/generation/slim.8b7178b58b_GEM-wiki_lingua_en_tldr_en_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.35679011396950494, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0039535541787012966 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.2525122163812022, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0028104769002719686 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.25402066807919726, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0022729602698409765 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.11566892110217673, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0025968459819964438 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.0758485270748662, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0016494845495132536 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.07776422929510499, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0015470867437394145 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.2787485396392972, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.00333060867857478 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.1946844152208185, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.002269590023349728 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.19606027302517406, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0018502837344183064 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.33780149114906943, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.003819320386381285 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.23865291484527454, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0027000637562272383 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.24005412545885543, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0021905454232920693 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 4.482664241932101, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.08212180996103731 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b58b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 4, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b58b/evaluation/generation/slim.8b7178b58b_GEM-wiki_lingua_en_tldr_en_3.json b/8b7178b58b/evaluation/generation/slim.8b7178b58b_GEM-wiki_lingua_en_tldr_en_3.json new file mode 100644 index 0000000000000000000000000000000000000000..f8c1e301bd23f320d41aea135cb84215e6f89441 --- /dev/null +++ b/8b7178b58b/evaluation/generation/slim.8b7178b58b_GEM-wiki_lingua_en_tldr_en_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.3061484539454385, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.004423098151670539 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.20167165147009586, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.003037208327664155 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.2113115990683054, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0027547750855983046 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.10017174467185903, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.002669280506981759 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.06128388820701079, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0016275016915406385 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.06469489115245816, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0015394791419511076 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.2427018640988824, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0037099343074804333 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.1573050958528797, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.002452551923134493 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.1649989495768865, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.002208842551468564 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.29051399119634647, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.004266689720705603 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.19088557384190263, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0029163289376507914 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.19989739105994972, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0026343775714049306 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 3.0072655046058805, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.09596043858220096 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b58b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 4, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b58b/evaluation/generation/slim.8b7178b58b_GEM-wiki_lingua_en_tldr_en_4.json b/8b7178b58b/evaluation/generation/slim.8b7178b58b_GEM-wiki_lingua_en_tldr_en_4.json new file mode 100644 index 0000000000000000000000000000000000000000..35bb605a5fa25fb6edf87a031bc0dd0801664d93 --- /dev/null +++ b/8b7178b58b/evaluation/generation/slim.8b7178b58b_GEM-wiki_lingua_en_tldr_en_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.09734210523837013, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.003585657330962349 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.06338401184872311, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.002461970340537986 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.06646559577850898, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.002389468792903583 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.0321171525149136, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0017883302892353346 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.019779405420936473, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0011693482689711905 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.020767091534965167, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.001088077081953597 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.07721998831670598, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.002911924342353414 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.05016221089779053, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.001994888739662481 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.05241812699049824, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0019162468765830335 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.09174287392107108, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0034181860926286 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.05945776168044872, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0023246003955623533 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.062355467850168954, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0022529742622293867 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 0.02961687910857089, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.00667797537003518 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b58b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 4, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b58b/evaluation/generation/slim.8b7178b58b_GEM-wiki_lingua_en_tldr_en_5.json b/8b7178b58b/evaluation/generation/slim.8b7178b58b_GEM-wiki_lingua_en_tldr_en_5.json new file mode 100644 index 0000000000000000000000000000000000000000..b26a8ea0ff610335b09d38ee07c16fbc045a0395 --- /dev/null +++ b/8b7178b58b/evaluation/generation/slim.8b7178b58b_GEM-wiki_lingua_en_tldr_en_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.01662223836437527, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0017200192815433816 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.010369987242786843, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0011350821871749513 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.010515163702672926, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.001060191799945764 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.0056669762870846345, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0008937346232787428 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.0035137406087487875, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0005888971524329703 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.0034609320209794962, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.000506080127090741 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.013605527079975888, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0014624549576253666 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.008580131540181942, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0009742333834018987 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.00858027237742148, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0008896522724178397 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.015819080798652796, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.001649211944475785 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.009938412449545603, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0011052383189021134 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.010008632917285501, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0010183013884774283 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 5.0425595242130537e-17, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 5.828914972997529e-15 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b58b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 4, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b58b/evaluation/generation/slim.8b7178b58b_e2e_nlg_cleaned_generate_text_restaurant_0.json b/8b7178b58b/evaluation/generation/slim.8b7178b58b_e2e_nlg_cleaned_generate_text_restaurant_0.json new file mode 100644 index 0000000000000000000000000000000000000000..e4de9fef4b618a75151df1ea0e19d109c6e12d97 --- /dev/null +++ b/8b7178b58b/evaluation/generation/slim.8b7178b58b_e2e_nlg_cleaned_generate_text_restaurant_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 3.727703428672484, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.16225275145292814 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.15580458811715164, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.004522055277902883 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.16212105310140335, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0038770863196531777 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.11677483396146617, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0026043522717618377 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.08759078800738393, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.004060781916683637 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.05918434764233474, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.001745078033222418 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.04207195309354536, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0011458322627199238 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.13984894212789747, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0044166136430229454 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.1340573709320961, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0031951681845401422 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.0970712318345091, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.002118544001686245 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.14388054529296093, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.004453879377805569 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.14043655820750423, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.003394973082402341 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.10190557193119215, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0022803567703003585 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b58b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 4, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b58b/evaluation/generation/slim.8b7178b58b_e2e_nlg_cleaned_generate_text_restaurant_1.json b/8b7178b58b/evaluation/generation/slim.8b7178b58b_e2e_nlg_cleaned_generate_text_restaurant_1.json new file mode 100644 index 0000000000000000000000000000000000000000..c097d593417aaef6c2c3ee6910d7986a37ff0292 --- /dev/null +++ b/8b7178b58b/evaluation/generation/slim.8b7178b58b_e2e_nlg_cleaned_generate_text_restaurant_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 12.253787105095654, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.1531956101772429 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.5916925132644157, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.00322106862270845 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.4463736554053124, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0030343957764200962 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.48227052690365063, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.002317881335104088 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.2838064949819702, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0027789665070579485 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.2105351617568858, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0022171957363924296 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.22765626131798156, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0020703831562182183 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.43217159380951586, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0029973445963260422 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.32230580960354577, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0024575923055788883 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.34946822459925764, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0020719433030147168 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.48366766620362545, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0032029340181387936 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.36354140064435775, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0027910193529178087 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.3932633862316688, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.002340814619008484 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b58b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 4, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b58b/evaluation/generation/slim.8b7178b58b_e2e_nlg_cleaned_generate_text_restaurant_2.json b/8b7178b58b/evaluation/generation/slim.8b7178b58b_e2e_nlg_cleaned_generate_text_restaurant_2.json new file mode 100644 index 0000000000000000000000000000000000000000..9da7d3ddbd98c89669563bdfd09457f6152c5afb --- /dev/null +++ b/8b7178b58b/evaluation/generation/slim.8b7178b58b_e2e_nlg_cleaned_generate_text_restaurant_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 14.934222887897532, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.21278791413856055 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.6137196300402722, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0031475076717186906 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.48231229181347424, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.002994935365094384 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.5160444555536067, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.00228951307038736 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.3128748478554642, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0028571435877434844 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.24224424588278937, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.002338319832959116 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.2594509643808628, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0021848217582054836 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.4496161361042401, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.002965960715542685 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.35106979956416473, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0025186871703425898 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.37626113256931526, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0021363134322449147 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.5075541777391559, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.003180746032746745 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.3982152959674102, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.002838831357019365 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.42631762287613684, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.00239431216095114 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b58b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 4, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b58b/evaluation/generation/slim.8b7178b58b_e2e_nlg_cleaned_generate_text_restaurant_3.json b/8b7178b58b/evaluation/generation/slim.8b7178b58b_e2e_nlg_cleaned_generate_text_restaurant_3.json new file mode 100644 index 0000000000000000000000000000000000000000..6563b0a116a0667ebac79705af25432487a4656a --- /dev/null +++ b/8b7178b58b/evaluation/generation/slim.8b7178b58b_e2e_nlg_cleaned_generate_text_restaurant_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 15.550166229098965, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.21100324131614723 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.6164424274284126, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0031180799828950793 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.49077882213900875, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.002902655623188235 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.5240247422123916, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0022364704364336795 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.3165046826237152, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.002782884317807398 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.24838679979596562, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0023021548981493603 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.2655834480484239, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0021599553939183514 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.45453733777109134, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0029846320407150165 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.35943496219625287, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.002503259775759038 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.38460762326164105, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0021692227869033478 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.5148376263253541, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0031730624992959006 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.4092664706750279, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.002806743229599867 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.4372484038981659, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.002394606287079693 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b58b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 4, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b58b/evaluation/generation/slim.8b7178b58b_e2e_nlg_cleaned_generate_text_restaurant_4.json b/8b7178b58b/evaluation/generation/slim.8b7178b58b_e2e_nlg_cleaned_generate_text_restaurant_4.json new file mode 100644 index 0000000000000000000000000000000000000000..923969cd89a4abc6d8e4caa1b81598588995b411 --- /dev/null +++ b/8b7178b58b/evaluation/generation/slim.8b7178b58b_e2e_nlg_cleaned_generate_text_restaurant_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 15.882734366339575, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.20014792318307217 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.617829970748385, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0031627975477214964 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.4934813921824228, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0028974554963002866 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.5268811401300224, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.002296537855184882 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.31982595333569097, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.002834806640598152 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.2524396113719004, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.002374239958755143 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.2697484320297564, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0022376325121211964 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.4547884196194121, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0029857683967765883 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.36242825370807497, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.00256326606590863 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.38708461902411606, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.002242571110085911 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.5162937268213095, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.003187124832415968 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.4128904038699314, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0028402630566630306 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.4406025001412695, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0024516808057243426 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b58b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 4, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b58b/evaluation/generation/slim.8b7178b58b_e2e_nlg_cleaned_generate_text_restaurant_5.json b/8b7178b58b/evaluation/generation/slim.8b7178b58b_e2e_nlg_cleaned_generate_text_restaurant_5.json new file mode 100644 index 0000000000000000000000000000000000000000..661149eac168192b9a4ce0ea2c6884ffb3b3a233 --- /dev/null +++ b/8b7178b58b/evaluation/generation/slim.8b7178b58b_e2e_nlg_cleaned_generate_text_restaurant_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 15.843755546529314, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.23380050838762192 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.6189660173531598, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.003202216597059111 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.49387787166933184, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.00292152626004202 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.5268007980171965, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0022830659821340285 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.32113506253536717, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.002823936183018856 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.25289072399317875, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0023526916821315917 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.26998871183013234, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0021968682565042135 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.45492486270003574, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.002993407598047982 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.3622504836542661, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.002569318863258077 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.38651546157123484, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.002221892359998622 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.5179172358492237, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0032140290174150392 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.4135121055179984, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0028519351140784115 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.44101339790167177, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0024405926593214712 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b58b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 4, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b58b/evaluation/generation/slim.8b7178b58b_gem_xsum_article_DOC_summary_0.json b/8b7178b58b/evaluation/generation/slim.8b7178b58b_gem_xsum_article_DOC_summary_0.json new file mode 100644 index 0000000000000000000000000000000000000000..732bee5753e031573fd1c802e58c3b8d1800c284 --- /dev/null +++ b/8b7178b58b/evaluation/generation/slim.8b7178b58b_gem_xsum_article_DOC_summary_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.16834475552405148, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.002143734509300351 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.3812302941527284, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.004466228338306761 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.22900899484830875, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.002592170416843644 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.04090800254887081, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.001331305757616898 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.09717669760813316, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0031305903631064793 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.056521580391250686, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0017743435854162372 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.12317643828521285, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0017773839864967875 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.2797265709939456, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0036566609405842706 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.16720327598962526, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0020460047183396978 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.1339383429556578, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0019089490816378235 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.3045528042834054, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.004033519848039268 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.18208585408505043, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.00227028405987386 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 2.4021403698389303, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.067244017856741 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b58b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 4, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b58b/evaluation/generation/slim.8b7178b58b_gem_xsum_article_DOC_summary_1.json b/8b7178b58b/evaluation/generation/slim.8b7178b58b_gem_xsum_article_DOC_summary_1.json new file mode 100644 index 0000000000000000000000000000000000000000..6802cd32ba1d96b65a514c06e817b4064c462c52 --- /dev/null +++ b/8b7178b58b/evaluation/generation/slim.8b7178b58b_gem_xsum_article_DOC_summary_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.2269075171314588, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.004333302214651766 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.24532990314212508, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.003988402379243326 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.22010181845678548, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0035289902424468713 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.052629985612383176, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0026272197223151062 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.05514694411681367, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.002420925395374345 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.04964766400970655, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.002214536505649702 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.1721080105359506, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.003568699794613313 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.18654158462763012, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0032259213006477503 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.16668249804551818, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.002858700548419538 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.17318677280555747, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0035702087618089537 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.18887685302453283, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.003346146632601525 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.168054574737479, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0028788648929427077 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 2.587973656923586, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.18271829592693106 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b58b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 4, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b58b/evaluation/generation/slim.8b7178b58b_gem_xsum_article_DOC_summary_2.json b/8b7178b58b/evaluation/generation/slim.8b7178b58b_gem_xsum_article_DOC_summary_2.json new file mode 100644 index 0000000000000000000000000000000000000000..74f2cc55fa8168562e8c2ca705f2f9430ad6191d --- /dev/null +++ b/8b7178b58b/evaluation/generation/slim.8b7178b58b_gem_xsum_article_DOC_summary_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.23962839287439405, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.004379685148326459 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.24084621475655701, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.003791189958412602 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.22681874696670282, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0035634918232377074 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.05825281986003038, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0026810505602905777 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.056775559678677465, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.002426834325647628 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.05421648195620343, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0023479794051376422 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.1845331825452337, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.003580958301916115 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.18702023658313446, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.003174519635609054 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.17492387767242143, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0029179836282209 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.1851109498506353, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0035857038136326946 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.1874180466959014, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0031802199539878143 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.17541718007715307, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0029228112018755566 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 2.894349555094649, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.20938561045016857 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b58b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 4, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b58b/evaluation/generation/slim.8b7178b58b_gem_xsum_article_DOC_summary_3.json b/8b7178b58b/evaluation/generation/slim.8b7178b58b_gem_xsum_article_DOC_summary_3.json new file mode 100644 index 0000000000000000000000000000000000000000..fba2e072ed53402b9f8aecd25cbfa412f410476f --- /dev/null +++ b/8b7178b58b/evaluation/generation/slim.8b7178b58b_gem_xsum_article_DOC_summary_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.2493216186518576, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0049084458961309585 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.23437481439478378, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.00414167551937926 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.22875361771029976, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.004084338493816929 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.06426035314217526, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0029430708789924724 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.05825170712730457, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0025593535615914685 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.058170472646030105, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.002575465227066567 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.19044444305113, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.004057392892502295 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.1796956624879631, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0034464435487860908 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.17477557833568425, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.003389234359734604 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.19176785292110343, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.004051683679981941 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.1817729140455351, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0034769204180304563 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.17624162420032213, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0033874175464656286 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 3.3807185036949794, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.21747997288721058 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b58b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 4, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b58b/evaluation/generation/slim.8b7178b58b_gem_xsum_article_DOC_summary_4.json b/8b7178b58b/evaluation/generation/slim.8b7178b58b_gem_xsum_article_DOC_summary_4.json new file mode 100644 index 0000000000000000000000000000000000000000..e7a14f1d307e4ff0ad1302b1e991686ebf3d5aa9 --- /dev/null +++ b/8b7178b58b/evaluation/generation/slim.8b7178b58b_gem_xsum_article_DOC_summary_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.06368749975876878, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.004163291649927898 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.05633355721143847, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.003674327931986382 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.055495095278546853, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0035332699011158906 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.01625809935844295, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.001744008450570692 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.014127871826558468, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0014279592951878697 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.014126745787126624, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0014244420667161892 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.048922678698080466, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.003321571568066582 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.04260833742058202, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0028433365851945613 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.042006581084650725, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.002736359920016333 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.049121011091270275, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0033301554897141204 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.042965789423027506, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0028912525537101723 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.04223553974124363, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0027526558135678226 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 0.11188091321184003, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.02931669237987178 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b58b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 4, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b58b/evaluation/generation/slim.8b7178b58b_gem_xsum_article_DOC_summary_5.json b/8b7178b58b/evaluation/generation/slim.8b7178b58b_gem_xsum_article_DOC_summary_5.json new file mode 100644 index 0000000000000000000000000000000000000000..13f9153062a4441707a991bb553093e6b4550610 --- /dev/null +++ b/8b7178b58b/evaluation/generation/slim.8b7178b58b_gem_xsum_article_DOC_summary_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.002666427538603693, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.001013100557726815 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.0025861091150659685, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.0008630243879275325 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.002533146063446972, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0008926774274323296 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.0007974546793721661, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0004389545775956508 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.0006295661715078737, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.00030074990914758437 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.0006840490507628032, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.00035126113759812106 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.002022260888604123, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0008452973095491474 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.0018561449826780235, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0006574742336350735 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.0018694866909844472, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0007140136174659965 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.00205235327222183, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0008479115148274438 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.0019247556173263936, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0006749866649238696 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.0019113224438188196, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.000720026623055153 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 2.2560041633308834e-45, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 1.8421463064085026e-30 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b58b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 4, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b58b/evaluation/rankeval/8b7178b58b_0.json b/8b7178b58b/evaluation/rankeval/8b7178b58b_0.json new file mode 100644 index 0000000000000000000000000000000000000000..d7f2f704eb7b6e0869a9a13f0d23adec536a1710 --- /dev/null +++ b/8b7178b58b/evaluation/rankeval/8b7178b58b_0.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.331, + "acc_stderr": 0.014888272588203936 + }, + "anli_r2": { + "acc": 0.336, + "acc_stderr": 0.014944140233795027 + }, + "anli_r3": { + "acc": 0.3425, + "acc_stderr": 0.013704669762934727 + }, + "cb": { + "acc": 0.42857142857142855, + "acc_stderr": 0.06672848092813058, + "f1": 0.21956970232832299 + }, + "copa": { + "acc": 0.74, + "acc_stderr": 0.044084400227680794 + }, + "hellaswag": { + "acc": 0.4480183230432185, + "acc_stderr": 0.004962742426849887, + "acc_norm": 0.5839474208325035, + "acc_norm_stderr": 0.0049189510191838875 + }, + "rte": { + "acc": 0.5631768953068592, + "acc_stderr": 0.029855247390314945 + }, + "winogrande": { + "acc": 0.5730071033938438, + "acc_stderr": 0.01390187807257506 + }, + "storycloze_2016": { + "acc": 0.6916087653661144, + "acc_stderr": 0.010679734445487797 + }, + "boolq": { + "acc": 0.5892966360856269, + "acc_stderr": 0.008604460608471413 + }, + "arc_easy": { + "acc": 0.609006734006734, + "acc_stderr": 0.010012992232540633, + "acc_norm": 0.5593434343434344, + "acc_norm_stderr": 0.010187264635711991 + }, + "arc_challenge": { + "acc": 0.2781569965870307, + "acc_stderr": 0.013094469919538816, + "acc_norm": 0.29436860068259385, + "acc_norm_stderr": 0.013318528460539426 + }, + "sciq": { + "acc": 0.865, + "acc_stderr": 0.010811655372416053, + "acc_norm": 0.793, + "acc_norm_stderr": 0.012818553557843983 + }, + "piqa": { + "acc": 0.7442872687704026, + "acc_stderr": 0.010178690109459857, + "acc_norm": 0.7546245919477693, + "acc_norm_stderr": 0.010039831320422386 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/8b7178b58b/evaluation/rankeval/8b7178b58b_0_lm-eval_global_step84877_2023-02-04-19-09-29_0shots_backup.json b/8b7178b58b/evaluation/rankeval/8b7178b58b_0_lm-eval_global_step84877_2023-02-04-19-09-29_0shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..d7f2f704eb7b6e0869a9a13f0d23adec536a1710 --- /dev/null +++ b/8b7178b58b/evaluation/rankeval/8b7178b58b_0_lm-eval_global_step84877_2023-02-04-19-09-29_0shots_backup.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.331, + "acc_stderr": 0.014888272588203936 + }, + "anli_r2": { + "acc": 0.336, + "acc_stderr": 0.014944140233795027 + }, + "anli_r3": { + "acc": 0.3425, + "acc_stderr": 0.013704669762934727 + }, + "cb": { + "acc": 0.42857142857142855, + "acc_stderr": 0.06672848092813058, + "f1": 0.21956970232832299 + }, + "copa": { + "acc": 0.74, + "acc_stderr": 0.044084400227680794 + }, + "hellaswag": { + "acc": 0.4480183230432185, + "acc_stderr": 0.004962742426849887, + "acc_norm": 0.5839474208325035, + "acc_norm_stderr": 0.0049189510191838875 + }, + "rte": { + "acc": 0.5631768953068592, + "acc_stderr": 0.029855247390314945 + }, + "winogrande": { + "acc": 0.5730071033938438, + "acc_stderr": 0.01390187807257506 + }, + "storycloze_2016": { + "acc": 0.6916087653661144, + "acc_stderr": 0.010679734445487797 + }, + "boolq": { + "acc": 0.5892966360856269, + "acc_stderr": 0.008604460608471413 + }, + "arc_easy": { + "acc": 0.609006734006734, + "acc_stderr": 0.010012992232540633, + "acc_norm": 0.5593434343434344, + "acc_norm_stderr": 0.010187264635711991 + }, + "arc_challenge": { + "acc": 0.2781569965870307, + "acc_stderr": 0.013094469919538816, + "acc_norm": 0.29436860068259385, + "acc_norm_stderr": 0.013318528460539426 + }, + "sciq": { + "acc": 0.865, + "acc_stderr": 0.010811655372416053, + "acc_norm": 0.793, + "acc_norm_stderr": 0.012818553557843983 + }, + "piqa": { + "acc": 0.7442872687704026, + "acc_stderr": 0.010178690109459857, + "acc_norm": 0.7546245919477693, + "acc_norm_stderr": 0.010039831320422386 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/8b7178b58b/evaluation/rankeval/8b7178b58b_1.json b/8b7178b58b/evaluation/rankeval/8b7178b58b_1.json new file mode 100644 index 0000000000000000000000000000000000000000..81fd740f50c4352b50b02492c16a0784353465ae --- /dev/null +++ b/8b7178b58b/evaluation/rankeval/8b7178b58b_1.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.337, + "acc_stderr": 0.014955087918653605 + }, + "anli_r2": { + "acc": 0.339, + "acc_stderr": 0.014976758771620345 + }, + "anli_r3": { + "acc": 0.33, + "acc_stderr": 0.013579531277800923 + }, + "cb": { + "acc": 0.4642857142857143, + "acc_stderr": 0.06724777654937658, + "f1": 0.32751039809863336 + }, + "copa": { + "acc": 0.78, + "acc_stderr": 0.04163331998932261 + }, + "hellaswag": { + "acc": 0.4508066122286397, + "acc_stderr": 0.004965572246803864, + "acc_norm": 0.5974905397331209, + "acc_norm_stderr": 0.004894012555642632 + }, + "rte": { + "acc": 0.5018050541516246, + "acc_stderr": 0.030096267148976626 + }, + "winogrande": { + "acc": 0.5611681136543015, + "acc_stderr": 0.013946933444507032 + }, + "storycloze_2016": { + "acc": 0.7001603420630679, + "acc_stderr": 0.010595525174558598 + }, + "boolq": { + "acc": 0.618348623853211, + "acc_stderr": 0.008496550741178263 + }, + "arc_easy": { + "acc": 0.63510101010101, + "acc_stderr": 0.009878157021155649, + "acc_norm": 0.625, + "acc_norm_stderr": 0.009933992677987828 + }, + "arc_challenge": { + "acc": 0.2901023890784983, + "acc_stderr": 0.01326157367752076, + "acc_norm": 0.3174061433447099, + "acc_norm_stderr": 0.01360223908803817 + }, + "sciq": { + "acc": 0.905, + "acc_stderr": 0.009276910103103317, + "acc_norm": 0.906, + "acc_norm_stderr": 0.009233052000787735 + }, + "piqa": { + "acc": 0.7470076169749728, + "acc_stderr": 0.01014288869886246, + "acc_norm": 0.7486398258977149, + "acc_norm_stderr": 0.01012115601681924 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/8b7178b58b/evaluation/rankeval/8b7178b58b_1_lm-eval_global_step84877_2023-02-04-19-09-29_1shots_backup.json b/8b7178b58b/evaluation/rankeval/8b7178b58b_1_lm-eval_global_step84877_2023-02-04-19-09-29_1shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..81fd740f50c4352b50b02492c16a0784353465ae --- /dev/null +++ b/8b7178b58b/evaluation/rankeval/8b7178b58b_1_lm-eval_global_step84877_2023-02-04-19-09-29_1shots_backup.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.337, + "acc_stderr": 0.014955087918653605 + }, + "anli_r2": { + "acc": 0.339, + "acc_stderr": 0.014976758771620345 + }, + "anli_r3": { + "acc": 0.33, + "acc_stderr": 0.013579531277800923 + }, + "cb": { + "acc": 0.4642857142857143, + "acc_stderr": 0.06724777654937658, + "f1": 0.32751039809863336 + }, + "copa": { + "acc": 0.78, + "acc_stderr": 0.04163331998932261 + }, + "hellaswag": { + "acc": 0.4508066122286397, + "acc_stderr": 0.004965572246803864, + "acc_norm": 0.5974905397331209, + "acc_norm_stderr": 0.004894012555642632 + }, + "rte": { + "acc": 0.5018050541516246, + "acc_stderr": 0.030096267148976626 + }, + "winogrande": { + "acc": 0.5611681136543015, + "acc_stderr": 0.013946933444507032 + }, + "storycloze_2016": { + "acc": 0.7001603420630679, + "acc_stderr": 0.010595525174558598 + }, + "boolq": { + "acc": 0.618348623853211, + "acc_stderr": 0.008496550741178263 + }, + "arc_easy": { + "acc": 0.63510101010101, + "acc_stderr": 0.009878157021155649, + "acc_norm": 0.625, + "acc_norm_stderr": 0.009933992677987828 + }, + "arc_challenge": { + "acc": 0.2901023890784983, + "acc_stderr": 0.01326157367752076, + "acc_norm": 0.3174061433447099, + "acc_norm_stderr": 0.01360223908803817 + }, + "sciq": { + "acc": 0.905, + "acc_stderr": 0.009276910103103317, + "acc_norm": 0.906, + "acc_norm_stderr": 0.009233052000787735 + }, + "piqa": { + "acc": 0.7470076169749728, + "acc_stderr": 0.01014288869886246, + "acc_norm": 0.7486398258977149, + "acc_norm_stderr": 0.01012115601681924 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/8b7178b58b/evaluation/rankeval/8b7178b58b_2.json b/8b7178b58b/evaluation/rankeval/8b7178b58b_2.json new file mode 100644 index 0000000000000000000000000000000000000000..2d9032e3e2b2f1daa6379ebd0d6233a9b12d1833 --- /dev/null +++ b/8b7178b58b/evaluation/rankeval/8b7178b58b_2.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.325, + "acc_stderr": 0.014818724459095526 + }, + "anli_r2": { + "acc": 0.326, + "acc_stderr": 0.014830507204541033 + }, + "anli_r3": { + "acc": 0.3475, + "acc_stderr": 0.013751753243291854 + }, + "cb": { + "acc": 0.48214285714285715, + "acc_stderr": 0.06737697508644648, + "f1": 0.3356643356643356 + }, + "copa": { + "acc": 0.72, + "acc_stderr": 0.04512608598542129 + }, + "hellaswag": { + "acc": 0.4523003385779725, + "acc_stderr": 0.004967023435680015, + "acc_norm": 0.5990838478390759, + "acc_norm_stderr": 0.004890824718530304 + }, + "rte": { + "acc": 0.49458483754512633, + "acc_stderr": 0.030094698123239966 + }, + "winogrande": { + "acc": 0.5911602209944752, + "acc_stderr": 0.013816954295135686 + }, + "storycloze_2016": { + "acc": 0.694815606627472, + "acc_stderr": 0.010648664383985665 + }, + "boolq": { + "acc": 0.6039755351681957, + "acc_stderr": 0.008553881336813412 + }, + "arc_easy": { + "acc": 0.6367845117845118, + "acc_stderr": 0.009868397136118794, + "acc_norm": 0.63510101010101, + "acc_norm_stderr": 0.009878157021155649 + }, + "arc_challenge": { + "acc": 0.31569965870307165, + "acc_stderr": 0.013582571095815293, + "acc_norm": 0.3250853242320819, + "acc_norm_stderr": 0.013688147309729124 + }, + "sciq": { + "acc": 0.927, + "acc_stderr": 0.00823035471524406, + "acc_norm": 0.924, + "acc_norm_stderr": 0.008384169266796384 + }, + "piqa": { + "acc": 0.750816104461371, + "acc_stderr": 0.01009188277012022, + "acc_norm": 0.7546245919477693, + "acc_norm_stderr": 0.010039831320422386 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/8b7178b58b/evaluation/rankeval/8b7178b58b_2_lm-eval_global_step84877_2023-02-04-19-09-29_2shots_backup.json b/8b7178b58b/evaluation/rankeval/8b7178b58b_2_lm-eval_global_step84877_2023-02-04-19-09-29_2shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..2d9032e3e2b2f1daa6379ebd0d6233a9b12d1833 --- /dev/null +++ b/8b7178b58b/evaluation/rankeval/8b7178b58b_2_lm-eval_global_step84877_2023-02-04-19-09-29_2shots_backup.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.325, + "acc_stderr": 0.014818724459095526 + }, + "anli_r2": { + "acc": 0.326, + "acc_stderr": 0.014830507204541033 + }, + "anli_r3": { + "acc": 0.3475, + "acc_stderr": 0.013751753243291854 + }, + "cb": { + "acc": 0.48214285714285715, + "acc_stderr": 0.06737697508644648, + "f1": 0.3356643356643356 + }, + "copa": { + "acc": 0.72, + "acc_stderr": 0.04512608598542129 + }, + "hellaswag": { + "acc": 0.4523003385779725, + "acc_stderr": 0.004967023435680015, + "acc_norm": 0.5990838478390759, + "acc_norm_stderr": 0.004890824718530304 + }, + "rte": { + "acc": 0.49458483754512633, + "acc_stderr": 0.030094698123239966 + }, + "winogrande": { + "acc": 0.5911602209944752, + "acc_stderr": 0.013816954295135686 + }, + "storycloze_2016": { + "acc": 0.694815606627472, + "acc_stderr": 0.010648664383985665 + }, + "boolq": { + "acc": 0.6039755351681957, + "acc_stderr": 0.008553881336813412 + }, + "arc_easy": { + "acc": 0.6367845117845118, + "acc_stderr": 0.009868397136118794, + "acc_norm": 0.63510101010101, + "acc_norm_stderr": 0.009878157021155649 + }, + "arc_challenge": { + "acc": 0.31569965870307165, + "acc_stderr": 0.013582571095815293, + "acc_norm": 0.3250853242320819, + "acc_norm_stderr": 0.013688147309729124 + }, + "sciq": { + "acc": 0.927, + "acc_stderr": 0.00823035471524406, + "acc_norm": 0.924, + "acc_norm_stderr": 0.008384169266796384 + }, + "piqa": { + "acc": 0.750816104461371, + "acc_stderr": 0.01009188277012022, + "acc_norm": 0.7546245919477693, + "acc_norm_stderr": 0.010039831320422386 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/8b7178b58b/evaluation/rankeval/8b7178b58b_3.json b/8b7178b58b/evaluation/rankeval/8b7178b58b_3.json new file mode 100644 index 0000000000000000000000000000000000000000..35c9675cc3443cbcb45ac6f94aac3627c1d9b4d5 --- /dev/null +++ b/8b7178b58b/evaluation/rankeval/8b7178b58b_3.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.321, + "acc_stderr": 0.014770821817934656 + }, + "anli_r2": { + "acc": 0.333, + "acc_stderr": 0.014910846164229859 + }, + "anli_r3": { + "acc": 0.3475, + "acc_stderr": 0.013751753243291852 + }, + "cb": { + "acc": 0.39285714285714285, + "acc_stderr": 0.0658538889806635, + "f1": 0.269763077644851 + }, + "copa": { + "acc": 0.79, + "acc_stderr": 0.040936018074033256 + }, + "hellaswag": { + "acc": 0.4523999203345947, + "acc_stderr": 0.004967118575905285, + "acc_norm": 0.5977892850029874, + "acc_norm_stderr": 0.004893418929918259 + }, + "rte": { + "acc": 0.5054151624548736, + "acc_stderr": 0.030094698123239966 + }, + "winogrande": { + "acc": 0.5864246250986582, + "acc_stderr": 0.013840971763195308 + }, + "storycloze_2016": { + "acc": 0.711918760021379, + "acc_stderr": 0.010472537019822575 + }, + "boolq": { + "acc": 0.600611620795107, + "acc_stderr": 0.008566178448007833 + }, + "arc_easy": { + "acc": 0.6359427609427609, + "acc_stderr": 0.009873293392779118, + "acc_norm": 0.6325757575757576, + "acc_norm_stderr": 0.00989255261621155 + }, + "arc_challenge": { + "acc": 0.3122866894197952, + "acc_stderr": 0.013542598541688064, + "acc_norm": 0.33532423208191126, + "acc_norm_stderr": 0.013796182947785566 + }, + "sciq": { + "acc": 0.926, + "acc_stderr": 0.008282064512704159, + "acc_norm": 0.928, + "acc_norm_stderr": 0.008178195576218681 + }, + "piqa": { + "acc": 0.750272034820457, + "acc_stderr": 0.010099232969867488, + "acc_norm": 0.7573449401523396, + "acc_norm_stderr": 0.010002002569708688 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/8b7178b58b/evaluation/rankeval/8b7178b58b_3_lm-eval_global_step84877_2023-02-04-19-09-29_3shots_backup.json b/8b7178b58b/evaluation/rankeval/8b7178b58b_3_lm-eval_global_step84877_2023-02-04-19-09-29_3shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..35c9675cc3443cbcb45ac6f94aac3627c1d9b4d5 --- /dev/null +++ b/8b7178b58b/evaluation/rankeval/8b7178b58b_3_lm-eval_global_step84877_2023-02-04-19-09-29_3shots_backup.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.321, + "acc_stderr": 0.014770821817934656 + }, + "anli_r2": { + "acc": 0.333, + "acc_stderr": 0.014910846164229859 + }, + "anli_r3": { + "acc": 0.3475, + "acc_stderr": 0.013751753243291852 + }, + "cb": { + "acc": 0.39285714285714285, + "acc_stderr": 0.0658538889806635, + "f1": 0.269763077644851 + }, + "copa": { + "acc": 0.79, + "acc_stderr": 0.040936018074033256 + }, + "hellaswag": { + "acc": 0.4523999203345947, + "acc_stderr": 0.004967118575905285, + "acc_norm": 0.5977892850029874, + "acc_norm_stderr": 0.004893418929918259 + }, + "rte": { + "acc": 0.5054151624548736, + "acc_stderr": 0.030094698123239966 + }, + "winogrande": { + "acc": 0.5864246250986582, + "acc_stderr": 0.013840971763195308 + }, + "storycloze_2016": { + "acc": 0.711918760021379, + "acc_stderr": 0.010472537019822575 + }, + "boolq": { + "acc": 0.600611620795107, + "acc_stderr": 0.008566178448007833 + }, + "arc_easy": { + "acc": 0.6359427609427609, + "acc_stderr": 0.009873293392779118, + "acc_norm": 0.6325757575757576, + "acc_norm_stderr": 0.00989255261621155 + }, + "arc_challenge": { + "acc": 0.3122866894197952, + "acc_stderr": 0.013542598541688064, + "acc_norm": 0.33532423208191126, + "acc_norm_stderr": 0.013796182947785566 + }, + "sciq": { + "acc": 0.926, + "acc_stderr": 0.008282064512704159, + "acc_norm": 0.928, + "acc_norm_stderr": 0.008178195576218681 + }, + "piqa": { + "acc": 0.750272034820457, + "acc_stderr": 0.010099232969867488, + "acc_norm": 0.7573449401523396, + "acc_norm_stderr": 0.010002002569708688 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/8b7178b58b/evaluation/rankeval/8b7178b58b_4.json b/8b7178b58b/evaluation/rankeval/8b7178b58b_4.json new file mode 100644 index 0000000000000000000000000000000000000000..19493a615fa2782c480322dd18977b35b1037a18 --- /dev/null +++ b/8b7178b58b/evaluation/rankeval/8b7178b58b_4.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.324, + "acc_stderr": 0.014806864733738856 + }, + "anli_r2": { + "acc": 0.333, + "acc_stderr": 0.014910846164229873 + }, + "anli_r3": { + "acc": 0.33666666666666667, + "acc_stderr": 0.013647602942406401 + }, + "cb": { + "acc": 0.35714285714285715, + "acc_stderr": 0.0646095738380922, + "f1": 0.2275946275946276 + }, + "copa": { + "acc": 0.8, + "acc_stderr": 0.040201512610368445 + }, + "hellaswag": { + "acc": 0.4509061939852619, + "acc_stderr": 0.004965670398127354, + "acc_norm": 0.5998805018920533, + "acc_norm_stderr": 0.004889210628907973 + }, + "rte": { + "acc": 0.4584837545126354, + "acc_stderr": 0.029992535385373314 + }, + "winogrande": { + "acc": 0.5824782951854776, + "acc_stderr": 0.013859978264440248 + }, + "storycloze_2016": { + "acc": 0.7081774452164618, + "acc_stderr": 0.010512588616199622 + }, + "boolq": { + "acc": 0.5883792048929664, + "acc_stderr": 0.008607357686607963 + }, + "arc_easy": { + "acc": 0.6439393939393939, + "acc_stderr": 0.00982545460841631, + "acc_norm": 0.640993265993266, + "acc_norm_stderr": 0.009843424713072174 + }, + "arc_challenge": { + "acc": 0.29948805460750855, + "acc_stderr": 0.013385021637313565, + "acc_norm": 0.3387372013651877, + "acc_norm_stderr": 0.01383056892797433 + }, + "sciq": { + "acc": 0.922, + "acc_stderr": 0.008484573530118583, + "acc_norm": 0.93, + "acc_norm_stderr": 0.008072494358323499 + }, + "piqa": { + "acc": 0.750816104461371, + "acc_stderr": 0.010091882770120216, + "acc_norm": 0.750272034820457, + "acc_norm_stderr": 0.010099232969867472 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/8b7178b58b/evaluation/rankeval/8b7178b58b_4_lm-eval_global_step84877_2023-02-04-19-09-29_4shots_backup.json b/8b7178b58b/evaluation/rankeval/8b7178b58b_4_lm-eval_global_step84877_2023-02-04-19-09-29_4shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..19493a615fa2782c480322dd18977b35b1037a18 --- /dev/null +++ b/8b7178b58b/evaluation/rankeval/8b7178b58b_4_lm-eval_global_step84877_2023-02-04-19-09-29_4shots_backup.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.324, + "acc_stderr": 0.014806864733738856 + }, + "anli_r2": { + "acc": 0.333, + "acc_stderr": 0.014910846164229873 + }, + "anli_r3": { + "acc": 0.33666666666666667, + "acc_stderr": 0.013647602942406401 + }, + "cb": { + "acc": 0.35714285714285715, + "acc_stderr": 0.0646095738380922, + "f1": 0.2275946275946276 + }, + "copa": { + "acc": 0.8, + "acc_stderr": 0.040201512610368445 + }, + "hellaswag": { + "acc": 0.4509061939852619, + "acc_stderr": 0.004965670398127354, + "acc_norm": 0.5998805018920533, + "acc_norm_stderr": 0.004889210628907973 + }, + "rte": { + "acc": 0.4584837545126354, + "acc_stderr": 0.029992535385373314 + }, + "winogrande": { + "acc": 0.5824782951854776, + "acc_stderr": 0.013859978264440248 + }, + "storycloze_2016": { + "acc": 0.7081774452164618, + "acc_stderr": 0.010512588616199622 + }, + "boolq": { + "acc": 0.5883792048929664, + "acc_stderr": 0.008607357686607963 + }, + "arc_easy": { + "acc": 0.6439393939393939, + "acc_stderr": 0.00982545460841631, + "acc_norm": 0.640993265993266, + "acc_norm_stderr": 0.009843424713072174 + }, + "arc_challenge": { + "acc": 0.29948805460750855, + "acc_stderr": 0.013385021637313565, + "acc_norm": 0.3387372013651877, + "acc_norm_stderr": 0.01383056892797433 + }, + "sciq": { + "acc": 0.922, + "acc_stderr": 0.008484573530118583, + "acc_norm": 0.93, + "acc_norm_stderr": 0.008072494358323499 + }, + "piqa": { + "acc": 0.750816104461371, + "acc_stderr": 0.010091882770120216, + "acc_norm": 0.750272034820457, + "acc_norm_stderr": 0.010099232969867472 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/8b7178b58b/evaluation/rankeval/8b7178b58b_5.json b/8b7178b58b/evaluation/rankeval/8b7178b58b_5.json new file mode 100644 index 0000000000000000000000000000000000000000..fa05b42c18384aa06d01e674aaa242d7fea69693 --- /dev/null +++ b/8b7178b58b/evaluation/rankeval/8b7178b58b_5.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.34, + "acc_stderr": 0.014987482264363937 + }, + "anli_r2": { + "acc": 0.326, + "acc_stderr": 0.014830507204541033 + }, + "anli_r3": { + "acc": 0.3458333333333333, + "acc_stderr": 0.013736245342311014 + }, + "cb": { + "acc": 0.5178571428571429, + "acc_stderr": 0.06737697508644648, + "f1": 0.33534439416792355 + }, + "copa": { + "acc": 0.73, + "acc_stderr": 0.044619604333847394 + }, + "hellaswag": { + "acc": 0.45030870344552876, + "acc_stderr": 0.0049650784774355715, + "acc_norm": 0.60017924716192, + "acc_norm_stderr": 0.004888601874547486 + }, + "rte": { + "acc": 0.48375451263537905, + "acc_stderr": 0.030080573208738064 + }, + "winogrande": { + "acc": 0.5674822415153907, + "acc_stderr": 0.013923911578623827 + }, + "storycloze_2016": { + "acc": 0.7012292891501871, + "acc_stderr": 0.010584692134739974 + }, + "boolq": { + "acc": 0.5801223241590214, + "acc_stderr": 0.008632045504781744 + }, + "arc_easy": { + "acc": 0.6426767676767676, + "acc_stderr": 0.009833205612463114, + "acc_norm": 0.6426767676767676, + "acc_norm_stderr": 0.009833205612463106 + }, + "arc_challenge": { + "acc": 0.3165529010238908, + "acc_stderr": 0.01359243151906808, + "acc_norm": 0.3370307167235495, + "acc_norm_stderr": 0.013813476652902274 + }, + "sciq": { + "acc": 0.932, + "acc_stderr": 0.007964887911291603, + "acc_norm": 0.929, + "acc_norm_stderr": 0.008125578442487914 + }, + "piqa": { + "acc": 0.7584330794341676, + "acc_stderr": 0.009986718001804461, + "acc_norm": 0.7600652883569097, + "acc_norm_stderr": 0.009963625892809545 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/8b7178b58b/evaluation/rankeval/8b7178b58b_5_lm-eval_global_step84877_2023-02-04-19-09-29_5shots_backup.json b/8b7178b58b/evaluation/rankeval/8b7178b58b_5_lm-eval_global_step84877_2023-02-04-19-09-29_5shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..fa05b42c18384aa06d01e674aaa242d7fea69693 --- /dev/null +++ b/8b7178b58b/evaluation/rankeval/8b7178b58b_5_lm-eval_global_step84877_2023-02-04-19-09-29_5shots_backup.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.34, + "acc_stderr": 0.014987482264363937 + }, + "anli_r2": { + "acc": 0.326, + "acc_stderr": 0.014830507204541033 + }, + "anli_r3": { + "acc": 0.3458333333333333, + "acc_stderr": 0.013736245342311014 + }, + "cb": { + "acc": 0.5178571428571429, + "acc_stderr": 0.06737697508644648, + "f1": 0.33534439416792355 + }, + "copa": { + "acc": 0.73, + "acc_stderr": 0.044619604333847394 + }, + "hellaswag": { + "acc": 0.45030870344552876, + "acc_stderr": 0.0049650784774355715, + "acc_norm": 0.60017924716192, + "acc_norm_stderr": 0.004888601874547486 + }, + "rte": { + "acc": 0.48375451263537905, + "acc_stderr": 0.030080573208738064 + }, + "winogrande": { + "acc": 0.5674822415153907, + "acc_stderr": 0.013923911578623827 + }, + "storycloze_2016": { + "acc": 0.7012292891501871, + "acc_stderr": 0.010584692134739974 + }, + "boolq": { + "acc": 0.5801223241590214, + "acc_stderr": 0.008632045504781744 + }, + "arc_easy": { + "acc": 0.6426767676767676, + "acc_stderr": 0.009833205612463114, + "acc_norm": 0.6426767676767676, + "acc_norm_stderr": 0.009833205612463106 + }, + "arc_challenge": { + "acc": 0.3165529010238908, + "acc_stderr": 0.01359243151906808, + "acc_norm": 0.3370307167235495, + "acc_norm_stderr": 0.013813476652902274 + }, + "sciq": { + "acc": 0.932, + "acc_stderr": 0.007964887911291603, + "acc_norm": 0.929, + "acc_norm_stderr": 0.008125578442487914 + }, + "piqa": { + "acc": 0.7584330794341676, + "acc_stderr": 0.009986718001804461, + "acc_norm": 0.7600652883569097, + "acc_norm_stderr": 0.009963625892809545 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5da9a9c014b40b5abea71ad7926e781676e76ce4 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2710d07695f9bd1ed6a465df8c039e5993f86c15efda40e2359efdc7cd2d039e +size 208731415 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b13bbcb33fd420690ae8bfecb9866dd7e6d63d39 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c299cfb7a159c8e45297be3700920c1b3f53e2d247f6070ab8dcef8ee64b0d4 +size 208731415 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_0_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_0_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..03bbf90e042d57a69b96313242dbe254943a95c6 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_0_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8591c05ad4a4f81c778b6c47eb4ebfbee35c3fa7aacb92e791b4445d7fcf92b0 +size 208732183 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_0_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_0_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..837de0a05e6afe3740ea7b7ed19c4ab478c0a8c0 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_0_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:686816b7db3fe9da8c6274625eb5a408e171b03c9cd9a808e3d0646708639589 +size 208732183 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..88e176fb1b309d6a1a3959978aac1a97c1c3215f --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9fd065f7498a611c8b924bfc91c537c9b715fed7b975814a2880a98224e6e8ed +size 208731437 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ba5f44217aae6404240071344a0a1adc5ae46d61 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ada32fbd5b1337061e850d3bd497a4773523f9e9825b895d6651d8b5cd44515 +size 208731437 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_100_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_100_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..84517e6b751a570f073c3050ae8b7fba9729d355 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_100_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe22aa46d9363a2ea00ca3ba4d5defc47a4b3135029b2c4417ebfe88c6a91e0f +size 208732269 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_100_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_100_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..21172ec8747ae16d421086acac7d5182dbe9725d --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_100_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a67dbc8bd3b6fe2b1a6f3a1f808ae1993b996759e7e3824a785fd6be123d8a82 +size 208732269 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ad26bb1a09b872541972a5ef5c26e143a7820f42 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a5fbb8c1fbd1a56f6b7c6293defa83b1da2cc5e102a05cfe42a4c19a74daaaa +size 208731437 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c9524b6ed92badc33516b4a4d84510612fe9826b --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:43a3d82eb5114eaeb99fa9c4ab2a14797a236963d1e159b07762e9e9ba0743db +size 208731437 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_101_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_101_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..816358c4c788eeae63edf658d4e63834708d55a1 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_101_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8e9ebf27337966ae53e6d8a7df053174730e36aa7ef3246600ced85571a4281 +size 208732077 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_101_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_101_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..85152dd1d97cd3a3cf7492ad74d421ba1778dbec --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_101_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f3929066bc42042bfe328d74154c28ffd8df0fbf82383b60077a68701c586864 +size 208732077 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1851561638f5343647ab4e4e8b5158e1dce77d4d --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:579f42e13dee48ec973366eb7ffaca983441df82d5c102b11f070c489d79f059 +size 208731437 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f1e54d9e4a30d64387b2c9ca725d48d78e0b8d18 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0fa581611c865b798ec483e2b09a2b7241095aa4de91688cd821f57bce9eb258 +size 208731437 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_102_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_102_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..850a04007a016cab2daf8f3af53578aa4d9bad05 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_102_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a79e836c6b94f9f9f1132ec82110b2b0d06e3d4bdcbdcf61cde5736ce24d3a9 +size 208732205 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_102_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_102_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b230a8de3a367ba997c959d462403df52af41248 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_102_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b9f0db35f21e4460db9acb26645419e49025c172b7d525a737ec02c4dd30526 +size 208732205 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..957b04d615dc7ebf549043ba779d2f8b9b056a21 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0bab3d01b2ed3efa577dc75a35b8e8c234f28ed191042e2439f31e18f2e2ee58 +size 208731373 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c8a6c8f07b5b065649463da91d271000c67d1445 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b5e6bc92eaf0f31c6548d57c26a337b6823e90a3c03d7ff16cd3685d5e7f8cd4 +size 208731373 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_103_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_103_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..10f3c5496dda00abc0078b3e5c495bc7fd956233 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_103_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:00b386978a05babc2bfe64894934dc27d167767d4e7bcf89a8b9edbd597a97d3 +size 208732205 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_103_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_103_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0ede0f20ad332de946e3f8c95ef701af2039485d --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_103_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10be80d4f918d39162d5a6270b2b7baa79602d4e3e19cc4304b4449d0055c91b +size 208732205 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..415c37cfa7b823c8d2ba2370538d633a0666e514 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9caa8da7e9cc1fefeead4c787b95bab458a3f029ecbec8cb0fd4902b33addb79 +size 208731501 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..859d0491a25e5e1899aaf3e7356836eebfcb951b --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:50ca5fafb16cb3bd113dfaf7551b71a65318ed98dd3d4bc70ebd5ac089ea0175 +size 208731501 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_104_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_104_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c9e8fe9fbf0780aff1db5bf7184b1b33636acd62 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_104_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:14d3eb78ffc73229db7007a3c898292c778dcccdda98145f82a78df44221a8c0 +size 208732205 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_104_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_104_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..eda5caf6d26536a7525d5411131933a8875e1f53 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_104_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:696ab1d09e3fd6763d939410c5652734ffcd1590c94827755fe7054bddee9ade +size 208732205 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a2109087a3cd2ae6a0ab6a9f633590ac1607f373 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9873eb086cf44a685f510deafe7c3f56ea151586e3706accc48f3930f4656bb4 +size 208731437 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..27eee12e77461f44d242abd56c2afb1a0464ee17 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7dc576274f3152be80c38d1fbba4349c9fdf890ff84dca1b2bd293da97e134ce +size 208731437 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_105_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_105_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b99263f085a3b6c3b4aa2e8f8d06d47c5d4c129f --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_105_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:369f8bf912dcf0ce471d1d99f459a0048e407337e3de15c44943dd36537adcd6 +size 208732205 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_105_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_105_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..159e4d100b9f366a69ca0867da65dadcbdb884e3 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_105_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d707644b9c08659a00f3c5c35815df85e78d579089b329d9ef086f53c31feb7 +size 208732205 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..35de5d0b352186ab4e6345460c793fc37ba9d24f --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5127a63bed85042507564a90941ed69c372bf51688f3ce4f830cda058f506f03 +size 208731437 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4839698a81af4a63468031d70e008566dcc2a891 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:416400302dd69b6e367a179ca2aa8febcde7a685430db817eff73ad520f284db +size 208731437 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_106_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_106_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..795a6d65bd85003c33a2824ff2643e411273df62 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_106_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8dd289acc03bad6246ce0ff8bb828e856fa076004f1ae1fed98b3d8ab210bbb8 +size 208732269 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_106_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_106_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f92f60f0030aa173075b1b8e17ca10df05dbdd60 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_106_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:85ac04f1c6e3ef14cc9c5fbb0956f5c34000173f98b1e9292f2aa56b026ee474 +size 208732269 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0f3069cd1980f4ea27387066df8eb9eca4f8c064 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e76ed93a0bade4c7f5139b5a3f6178f2962cbf83642b5612a9bcbb1d3878eb9f +size 208731501 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..50c8f5feb21ee6d4135e877ebda8d2ad136c5423 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e2d43fc535dca6804824cc9e60b21a45c927ba85245d15b651de5ca833b6343 +size 208731501 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_107_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_107_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2c55c36a165d6a201549ef7ef58d0e045d7cb36a --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_107_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d8308817ec8e93249b008dc96a155004754910f1549ca0709196ef409b24c901 +size 208732205 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_107_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_107_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0da9bc8f352149eb9b88b82e1a8ffbdceee626f0 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_107_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:86219f982bba46c71346243db3ee3c13838a734e35aa10196365bd7e6555916a +size 208732205 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..74d0115cee938d90b3a1eb4e1a1e1441cad8e24d --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:69e5610cdd17a99df1647b6c8c593532d826deb297dafdfbb81b986a47e34bdd +size 208731373 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..450807725cb71d41347c98f09e149701392e4698 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1bf84f9a036381764312bff20b8063d0974a030406cb398656b2dd804e97669c +size 208731373 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_108_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_108_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1967e056d1cfdfab65438046034f2660e9831730 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_108_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e69baa5a5373bcb93e564b4092e8b72cbab2d1c9231e7fcd8c62b746d13a8be9 +size 208732141 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_108_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_108_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..37c58e57a974f3ef8ea771526cdbe04cc3a3ddfa --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_108_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d341e5bc433e98abb6df7792aefc81d15421b184fa2102152c295b78964d0482 +size 208732141 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ee4d1f67c917a4c6c1ec19c859db8808021466e4 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46d85554ff454513ba51a6ca590a7ac90724dfc518b9fbb2301c2d319c2a8c55 +size 208731373 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e50fc11e81b0f6dee0a0df2451b1016cdfb277e0 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d1d8dd403106c220e79c211dc04620d9044cdc776c65e5b0fa47fd9a06893a5a +size 208731373 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_109_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_109_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..68fc9f703550fe5d222d5d1c059bc35855d6efd4 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_109_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a15990f429ed2f7528cd14f0fa3d3d734820bc58fd8bca34dd4cdeb78d5b0dd2 +size 208732141 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_109_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_109_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3cf8c54fc6aa940bb942194615ff0930727a702e --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_109_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cbe0caa03a06dbef0c44a833b6df876df62b77b33907ca254f463334ce2b8314 +size 208732141 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..be05eca21bf145c830adda833a0b4323e34401fc --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7005a28815dfc65cfdbab844679dae5a0e9af65968aa4a9f88fec97cac214858 +size 208731362 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..83c82a37c6d2d4b1585a29b5d3ddc4746da84225 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e48f841a9995a9273d7146d99f25bc0253427d2d86ec5f0d8fdacaf52f282767 +size 208731362 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_10_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_10_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6dfdc509e3b206a88282af1905819c5ad591b7ab --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_10_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a06a53cbbe5d27d0c7ec5ca070ae2c34c31d76825c927438db8ee184a8a524f +size 208732130 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_10_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_10_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..231d9f68280806d22f0183bac0a224b64df6522c --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_10_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb1058700231a922a2ce935ac49e088d5e36c0be0799305b5857f3c60bfd40a2 +size 208732130 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b0a767bf1166a73f050c7e9483b817a83fb1a5b9 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b57da46be5b42c71cb17418dd119453823fa4b0bda1d507f7b8bd410c5ffacf6 +size 208731437 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6a0987b4e3863db6dcb09a810567c205f5720e3b --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:503e0d5f347f03151dfb458bdd1ed6e86ce43d9e663d4bba128a6bfacecbec9f +size 208731437 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_110_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_110_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..63ec560b79482eb26e61502a33db36577f10e0ce --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_110_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac4cee7e5c5531c4b98a6ae54d24a684b5be8d795b5ff474287592722ddea619 +size 208732205 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_110_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_110_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..58353c2a94248998d7ece2ab105c5f3ee1f91791 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_110_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0cf684f8d421474f95c5cbda804ff8ecbe92c73184d22acd3463f249cdef302 +size 208732205 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..282930cab844cfe8f975e56cbec182d2a60e18ad --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3b87e6690b36979580f56b477afcb32e2ef5643aaeffa6fce99a3078dc8f54d +size 208731373 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e91556c531d861eb824af32ed62e642330a18f4c --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c9f251efce1fbedd3dcab7913b9a1e00a66d2eeeb966bdd2aa43d07a648ff3d +size 208731373 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_111_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_111_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bbd6df16c6e628f882b710faba8db046b48af632 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_111_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:61f036fe81ded84aeb4fc8fb752a797e14e7c38d72007b757ee84991f43869b2 +size 208732141 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_111_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_111_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5004763cf1ff9d39de4e4cbeaad4c43d0dba7bfe --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_111_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d2b4aba37da43e7ba95ca4f3a2f93d378e92167359e59fec2da6d1e8781edf6 +size 208732141 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..15d4b1810ebe56a3a2a172c5b74a5c78a06297b6 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:323a35c6136abda4e2c9c961015291f1a10aa07d5e980d5d1dbf20c76fe31277 +size 208731437 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e8240e53220c41621b9c463aa5695204bc9214cf --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da05ccccb919d7ba3906ec742505b360ee0fdc63da7f95bae65a18d83f2ed771 +size 208731437 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_112_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_112_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..01fcd46f189279b202131553d64c4b6e9036458d --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_112_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:947b1b1b833d65d7e2abae3925684fee3da8ca0e99ead68ad7852de8c7f638a0 +size 208732269 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_112_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_112_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..657230f5c1eef65aab4a673bf23847598d4a3535 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_112_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:82eaed68a02c59727f574a68d75fdcc6f6409576accd9731613534f41debd0e2 +size 208732269 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c2dab19a51b244ac288729b110a1b96e8531bcce --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f9b9d9a474b8e1e6f32f9545d11eda5cc9a2350f39b5bfd7dbaba80450bffbc8 +size 208731501 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ae81e46c65e27e930765fbc0f656714c60775f78 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73c5cb042185f93d4187002e5b04e0d3142c0214c6c1191de9c387a4529b5313 +size 208731501 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_113_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_113_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d56e8ae02f2777858e62d272cb75fea64c773542 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_113_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e879ce34d73b2deb4c55e7ae1cddd2818ad6989384867e9a66f52e02c8909cf6 +size 208732141 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_113_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_113_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b5bf6a0add20b5862af5daee88bad46c502721a5 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_113_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a44f575048db5882b6752c28575c37237595c79fd2ff59600dec65ce6af41896 +size 208732141 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4eda8a660ca6d46d1ca468a95abb4f7eb9ccd5dc --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:894d0d24fba96a15bc0faf3ad4bf3184d2174937bff98efb58c341ed518e3fb8 +size 208731309 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5a56abf3a45317ad7906ce573424c8da3cf5836f --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4fb910072f2e8f88e993cee49b5986d3bf4daa72338951ebd0ee81000a57a14f +size 208731309 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_114_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_114_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b0b811f538f55b65bc85e94f76cf35b6c4e104f9 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_114_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ee506e518ef28b4a909ee1020d29e0627de5617430ff09c0d6f9c83140874b4 +size 208732141 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_114_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_114_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..24470d7394ba30d9fbf0f5dbac3068f8c6c0c9ff --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_114_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f2783b7a9ddcb2cc73767e7029b8b5465b3bf1ef047d6a34d4becf51a1bdab5 +size 208732141 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1875b606f538bf791077857400003a5cc1cd02b8 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:17bc5a881ebb042cbf448292ff2911bc54d4c18c5231d8f7928f30ac74ff087c +size 208731437 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..031cac028b61cffcb75cbad4ba0ac33ed8bf72f9 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:854d4d787e49338da801fc17175fb499213629d4c14f832dca9345949bd7ac45 +size 208731437 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_115_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_115_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..929f01b65152512f89f889fd95a668f2d9fbed32 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_115_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02d7c261d4e754a899fe540eb69d8cf6cdd015d6eabce144d5874a28185e4657 +size 208732205 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_115_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_115_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..18f240b5d0a0f9743c8f73c736166c3044569d77 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_115_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:57fe7aa1f0d3324bdf57dbe031e05f94419721c0c9773c059156c995414059b3 +size 208732205 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7cf3cd05c225cd30de2a5b63e389ed5ccab848f2 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:878c5d60163f53d096ac02d795ccfe3fa36436dbe3ddd80e343099b21cd57831 +size 208731501 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fb4c555ff13f22498a51f1629178fc0ac011d231 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4af561e1708da49571a69fa58cf65246bca6c059970ceb7683baf02b6f51ca10 +size 208731501 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_116_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_116_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dc35e8cf57efe42c700f1814741799a63c3a3398 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_116_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:deb6b647de2e0b39ec293750bcff8ffc05d13dfd843cad35973e591e89e117ab +size 208732269 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_116_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_116_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..50eda3882a1ba6812382bb89a884544c5444b740 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_116_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:44d8a91e63b79d885a464011103c9a78cc610467cb5c8025124dc784c8b0741a +size 208732269 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..89c0290559e8ad3b6182eb141b3c4e2af8243d60 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c01cef295ff9433e619d13502cbefb129728b50d2f5360795d5dfe0b608031cc +size 208731437 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4d3d2ea2bf3967fca49a663f2e4e3c2b85a65807 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a0474056aa8d690486bb686a44bcc46c51b01af22e54a233858563d8e74b941a +size 208731437 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_117_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_117_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..658db209c3e833927d2251c3a8e2c01f43d1af7a --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_117_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2fbfabb601922b09f996117934a9b5798492432d14997a64327953e5f4a37a8d +size 208732205 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_117_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_117_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fa1ee7658a0772504b4a91637f88bb7f587d3f94 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_117_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:96e6f8eecbd7e52d9fd5e45e399ecdc3eac0482cd6a8f85868938675acda885f +size 208732205 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dfc5ee9ad829a3335505b88563300c5bcb30232b --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:56d81881f66169707ddde13b55f5882bb5f8c1cb3564e3ca5749425adb6a0ec4 +size 208731437 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6c65d777ef4b3c58ef13848ace2cad17ba73459d --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:404ec4d4cdf6ca3f6a978695c0d9a918d043737302dbdece0f96675ce0cee623 +size 208731437 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_118_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_118_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6867786df83808180681c3142f232cb1c15180c1 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_118_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a59657a7b71ba41446b0f9fe74d8083d8e370c41293ac6e81c1b9fe95970ff0 +size 208732205 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_118_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_118_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..29357e380560aa4dc9dfbf36aecdeac0ef6d3fae --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_118_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:15e273e3214b5904ff6606ca4c729fd1c818df77cd341d4a20cc04735821a1cb +size 208732205 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fc71ddd23d7424c1ffbd5d04d5d6c35d21acb480 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d6076a322d09d7238a0c635d103dc8ef729a34509885365960a2112f5a56437 +size 208731501 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a126fe0abb949d291deff119fc9e960410d4f6cd --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8f0930749cefc03b6e7d4bcee9f452323a81b2a1606b08fab636ea5d29fdd9c +size 208731501 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_119_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_119_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..62abd590f45a04a31ba7375d20e57ded99fd435f --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_119_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:14d51157dad17aadaeb622bfe2883186672ef02d87834843abde095981ef0fa7 +size 208732141 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_119_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_119_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5535012195b2ef73bb99565a20dd0c02b9565cda --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_119_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8ad64d7e5f966d9ed12f0bfd85c8184435e3b2027cb2b1770bea1c059435ee2 +size 208732141 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0615162ff0554eb2e94c9318684897bf56383f4b --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:09c46ecc7822f0bac70c9c6216e0dba1323d2bfd3f5444d0665c67671edac545 +size 208731490 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..48752c917f0717df65dafe032f57084d555be9be --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:86b71caa2461fdebd8b86e4080dc4e1fe491e4821590c1383cbb614ff0843345 +size 208731490 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_11_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_11_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3b86b997718329805c43be3059ef8bac10940365 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_11_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20168649ff27d8f10548f1282b02bf98fb1bf985cab9962ab7db7b0e8118ac71 +size 208732258 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_11_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_11_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2c488982a15b60c0997af84e2a3dd2087cc0fb31 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_11_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f16c39ab5ec50bad287d445c058ba9579c4b6d4aff306e6fef72c38abca0a9c6 +size 208732258 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..30dc0c413976962d0053e8c060c130f3941a67ee --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:171ef2eb91f37539989028c8c327f15110beeb64fbad07120b03a63ad78e7097 +size 208731373 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5003c8489bc5d558cb7addf0def095f42e3fd6ad --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:780aac1e250c4b4ac0d07e55e5bcd017f130e673a107c623a2eb89440783b31e +size 208731373 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_120_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_120_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..84d9186af285323b41e8a60c329330f6b70a99c7 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_120_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8f9874398bc446fc4e1afe842dd260c56e9f2c7cfd31119e72c8e2e4a64156b +size 208732205 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_120_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_120_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f82c30567190585a5ac4cf1ae49d9f6358364d63 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_120_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:abaf17aa681eadde52017794ebb9aefe7173ca5f90056cf348d8f200d1241d28 +size 208732205 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a4cdc3639f8e78d635eabcd97f8597180588bd84 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a27a9e616bb5d1b6be8906c47a1ea4b8ce6ce2987dae56d2f0eec29cb57ed494 +size 208731437 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..49ad6d54317c0319b9f5d833d380b1cbc1cd5a49 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:83aac10582cf78a855c5280ac038ee03e9cfcbca1d5ea45229d837c203db5607 +size 208731437 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_121_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_121_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..57e45794903c1b0d99411e87a366e5088debaa3e --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_121_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:49e132c356ff97dbe8016028e187b319fd5194fb8a98264610303dc1b0a8449c +size 208732205 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_121_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_121_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e1eae2319d8fe69a7c5d0775e2d26d5d4d75060c --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_121_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3469a94fd694452a9d676c0ce41016ba257b06d4974ee5380ee189d0b213c3a7 +size 208732205 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..86eaaac5f962817c68081a59fe4d1d6de17b3fe2 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:adc2ec810e83c497a713e589bf80663f20d30e5d3eb59a71ec237634b975ee8b +size 208731309 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4374f6b68278fcf82bb21b3072b0a6309d218ac7 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ff61adcae682c1efc8eb2c41f42dfa900fd88e7f2082d89d0d0a888e20d894e +size 208731309 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_122_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_122_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0618729e9d1c1b987f9f3509f69901549319840a --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_122_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:04ad49a252e42db56c4aa20e399a6a2789edb836d7a67ff7a9023a61f6a734bc +size 208732141 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_122_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_122_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fcc9d6b45245cb8ac46b836e7c2bb736feb0ff69 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_122_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b1cf0742ae9b6ea2858a77e63553d7a1ce7e80aed147e9deb291f63621814d0 +size 208732141 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d1d6288ca6e9e91deab1d68116346214ea412544 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e0ab9f6ee14414af2818282934ee6ce050fa8a41f9cd3a6ed3467406ddcf513 +size 208731373 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f191a9ee8d3fae07780fb8710709f4bfda3bc63a --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f255921dbfdd0863f44a9dd0440c825867dd994792e17359d147f7dcbbe1891 +size 208731373 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_123_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_123_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a811199c72eb4455eebeb3c4cf2fec34dcceddfb --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_123_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3be59aaa9c314f007ad7406ef3de8f4c03f98ee22fe2f38aeea33f57ffc0b72d +size 208732141 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_123_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_123_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8fe4c531630d830c822bf3420263c94e7f86e799 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_123_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:67f51958bf34592c96e982e62bd08d6414f0efde33ea782d7788978c6649d6fd +size 208732141 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..71bd4842e5200148ee3578345eb542622ef8dc9e --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:790d278668eae1e3340c770afc7806df56a549beb144a1f17055ec66a940d67e +size 208731501 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1d06abbb186583fb2ec0b68736c47a9352a5043a --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:327406e991ed7623aeaf83cb8c3d5c7a14370108ad5cdcc37bf4c271904d7c12 +size 208731501 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_124_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_124_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0940f8040d5a08106052e0eeb81fe77b55edd690 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_124_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a6be6aba3a61d164fb8e0103ae3e15206cfabbda7e37919bb0638e7d9609ea74 +size 208732269 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_124_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_124_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0ce17750fef4d24781eeb76a10069661b73276c0 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_124_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2459c38448ca7d6522428dc95df223ba743fb7bd02eeda699483112b5c752ce7 +size 208732269 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..82eb4c6bbcd7e1b698d289f0e57f3edb3648d9a9 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d367b6e5d2a25b86296b90cc15d00e3135576d1e989efa78e30562abb61edae7 +size 208731437 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5693606c38a1994bdb2cca8c7bfd173b187fc3a2 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bbcf7b4d48272791a9cef8d19385f3b0055a4e527e7251870d8c979085cb2812 +size 208731437 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_125_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_125_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ef85d0df0f79709117d3a780f0ba5341a776ff9e --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_125_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:577fab3b770ca82d638f00e875a4d81b45a5c0a9d55ec9269b6c37ce4b3c900c +size 208732141 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_125_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_125_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..12a5d0115a4274f07f44459fdd38dd3fd000b18f --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_125_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c156624c33fb886feeaf0004e7442d636e6e41f7b321d8a56230d10e5c3cf3d +size 208732141 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b4d7ca91225b62b08b863239058e7864e06771f9 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d12120e96e09d3ca4f9735de3827a21ae8a07573b1b294ac1354f465457e74a +size 208731373 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9f9ab78cbd7a089a9a02bccfafc43979ffa281d8 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8293fa595685e7e6f483aeb3c108388bf1ac9ba54a25ac2bfe52ff53730a1e8e +size 208731373 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_126_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_126_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a04339873e39625955b368581e7a2b75143bfdaa --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_126_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f87d884db154e85adda77a25047be5f327d230090dd70105b8b1999794d80964 +size 208732141 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_126_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_126_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6ef10ecc61eefd80865c7d400f2efb8ccb1231e4 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_126_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a1def80fa5ddc08aa5f631ccbf55fdadcbcb5d1d7e6d4f969a66c1d10fab054 +size 208732141 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e6fca8cee9276b36087d27227218365165c8cb14 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f8da1133999a1ee92195cb31f5111d73e994a17b6f429119525b096cae7e3ff9 +size 208731373 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a2db0b48e8e32840fb28381752fcb245ecfdc9dd --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:78977fcd1d3f46f9a5f055d1fed902824d44e24c39f839f903511faf8933c280 +size 208731373 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_127_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_127_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fcb07d0ac546a0f239a60a07b385b9a8e6d13260 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_127_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d59a334bd110dd5653dab7c2fa0e21aeaf9fcaa69aa87d707837db8191c5719 +size 208732077 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_127_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_127_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e24f54cba42a211467296e174e24c154d1e79ed2 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_127_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4069f28e875343d1152f75468d7c29604817c9d8701ac81bf28cc61954c7f8d7 +size 208732077 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e290e16e2ab177b82e4ba6b9b0436d4185b3218f --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f653873de87e46237389720b2fad19a99f4b9f749b62e886563045ee8cc111ed +size 208731554 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ce2c7481a507d7840806501615704ccc7dfcc8e7 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a299f0951d73f2b2209c980692c89993a7e78365c739ee5603c37b11b47ddc0f +size 208731554 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_12_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_12_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8faba0924b632678439ad242ddc264883b4acb6e --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_12_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:737bca42aa0d65e640c6ca42b446bf58951c0a7acda6b64d6c9ce69bac9730f0 +size 208732322 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_12_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_12_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b3f45a6fde477528d7e3aeba5a7d9ae269504cc5 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_12_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a236e231f666b4c006fdab99e1aeac960a5d28d25267501143c7ab93f4aa8225 +size 208732322 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a6ce9771dc31a1fa63e139ebc57133511eecab1e --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bbd048e82173484f29eb4e5f0493f56dfbd5ac38f43f759f48fe8d2334ad1780 +size 208731362 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ed30fdc3777d9a9402b095a888213d15a8e16b66 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb0699700b76f2d7bce34d4f2765ff12f07e2d76ba6a8febbc999284c13ed287 +size 208731362 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_13_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_13_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b4cf63fb7c9753c885a2e60a90644952addb67e6 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_13_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64ea05f7130e3f608f8c9679bf3c5aa8a7c133f8f464a2723ec996ecb533d1cc +size 208732130 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_13_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_13_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bf046de21cbb5e39826d411641187b5817cc7c5c --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_13_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c9571f313f0099fa0587edb841183e00a39dd6dfce6ff5712d8c3cecf2286790 +size 208732130 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..10012193c221d6e557e2dbbd2d9c30c157b86345 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:59aa22b1a081db98da0ec1a2e3c92421e1258a0017f3dbec9b8b727d03e9d684 +size 208731362 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3148a2c0c807bfe612f40ccd0182fd5eb1ba5aff --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:19a5c4086c50c8edfc4e94b82f2648bca91a076a12632faaa2deb6cd16581713 +size 208731362 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_14_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_14_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fbc5ea8b0e7ad281a502170f47289ae2c936615d --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_14_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d54056c73765a70144555169971cb47eccdee18792da1ec3e3271ae4adce01e +size 208732194 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_14_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_14_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d16ed856d95b7511e58fe78322040b30b29e198d --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_14_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:36b3ec7bc41a8e2e89bbb29a976e3bb8140b11293111fdf56cf8b4d42a9054b2 +size 208732194 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a785d0ea2bb3a6a7ed9c2838c974132429975cfc --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ab761476c68b72a2de2dd247078ec312ee32fb85e6a9cb95de34251ceeda38f +size 208731490 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..805d5377b5a517729fe91259fd51ddafb8ae73a2 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c7d1e272f5e0e273005a52697cab524a976c89036efe7e743df00fe654968af +size 208731490 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_15_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_15_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4d52eb0b71e95ad6691c2861161bb26d24c847af --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_15_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39fec707bf4118ed767823850ab70343a4faa1e99dfc185171c6f573587fcc4c +size 208732194 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_15_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_15_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4b50e89fcd87cf474cc8242999e6440b1ece055a --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_15_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2bbae8c21bdde9466d5d8e518c60b211bb95fa4550da89c95611a5fe02f74e2a +size 208732194 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..42563075d36503e1db56cf42453119fa76bc054a --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f3ee4f7068e66d92487f8e406fee00012b77e16354584b89a541ae059299e23f +size 208731426 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0bafcb392e15666004c7ae01fa2b251df76dacd3 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b3ae03dcc1ba5874e7d9574e14ed7a67aac51a97f42ada25ee4461cd4030691 +size 208731426 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_16_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_16_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..781df158f3f80fedd0b1300022cc4692ee2355e0 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_16_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:815dee3764a43f0489a1461bcaad72593e70e2edf87b9dd9e01ec807ab8dfb3a +size 208732258 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_16_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_16_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cf76db2b4baeef5944660d2d6f1c62be9e0c58cf --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_16_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c43eeefd4986b33fbc1554f170d278a787154f72dbde833b8dfb4c7af543369c +size 208732258 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3f205eb2d1ca95c861bd2e96d0d0cd2cb3f2dfcd --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cebc2f31689ede337c85b3c1eb58acd710da6d9cc2ae2889c1882886006ecbfe +size 208731298 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5aabce564297d2cf0b73d450ebfa06d11417c16d --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2e295b4c2901705ebe012237ba3fbf6c68bb8f73b4ec2b1adaea257339e4837 +size 208731298 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_17_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_17_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0d32f69ce7a7e888789b626cf9cd3069d2f13701 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_17_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:400e64ef4ae77b226c509378868eacaeb3f20493d9e4bd7287c90c1afaccb131 +size 208732066 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_17_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_17_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..04bf28d21d885e68b32ce74c039d48b10c3d3e9c --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_17_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7140402d4eded1d9b29b080d400fd912cacf8abdb02a67d7a9acf3e9df45673 +size 208732066 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9fcf7eac369327111845dcd4e7c0373e2d64d917 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa318e40a82e7d6764b5ee3be64163748551b0fda38f718f43e8c9bbe9c7eced +size 208731362 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f20241b2c7b30976ed92fe6a7bfeb2cb7b319558 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca2afbb63879d5c36edc3a27885b814f28139840b3cc95ab6b50008498f4d5d4 +size 208731362 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_18_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_18_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..12d87efe5032ad484c9ddcbf9f632aec8f752684 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_18_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da34cb34c1252c3714a71fd1017c52a746bc1c28dfd278db0bae3e8cec074112 +size 208732130 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_18_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_18_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c0776ca3dacea4f1b8a09c23efbad9a79f3c9def --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_18_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c83251f806c636b971291390f7e20e2636765783f29b846b74c24ed92019489f +size 208732130 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ea92d95071c612a88777ebc421b63a750d97fc41 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4582e839e390f5d47b274513296b182301bfb9c2bc4173b1b6e6a06209eba707 +size 208731362 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2f7b7cc8971e605fc2dc2c389fac2dade5ddded4 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e6c20fc45847eb315574a972fd80429e172c5ef9cd8fa533bed71fa7905ee06 +size 208731362 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_19_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_19_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0d8c545f777a6a8c3b05853092ec34acad7f73d5 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_19_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9210b149b709163abe95b8eb3836ccabdc7414e61a46b1abd57738e32f19034 +size 208732130 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_19_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_19_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1cdd543d865d10095f68eb1df151b35b5602f293 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_19_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06c19bc053862580a00ee799ea1c5bfba945bd05d13891596a24e3e2a4261dfc +size 208732130 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cce48139bc533d796d6962bea343283d1668119a --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd9c7ebe2b1df3d7e0990c98cd1c3d92ddc47e5eb9391b1c1019be59805a9642 +size 208731351 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..35eca3ab4c2b29be025bbb05c817a9d7a005b9e9 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d5a6bc4545632d8db6d8fee23c5dc58ba5073dbea97e8cbd968c6be1d3b61b7 +size 208731351 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_1_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_1_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3814740f28630ece72d15190da5d9a4b358b3624 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_1_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c5375e1661f0f71abcaab686e02111192a5c7715dbce8a7d0a6cadd05ecdd0e1 +size 208732119 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_1_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_1_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ea64211cace8b4970d555c77c8ec71757dbaaef2 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_1_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f4c82c0d9ba74f87c59c728a8f2aa32db8c184cb185780a8d0d79625f380f42 +size 208732119 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8cc30e529e1948ae078493d2fca27495041938ae --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1634913fac898b8a09d41b71c9f9b25e077771402106508f3c562f8ec7904a1b +size 208731490 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e45525c42b9b28a5e7d7cf8690644dfbce5b0797 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f6fa07e4e05bae8c3d50096a54949c56f6206b38cb0620bc600b47884ac460a1 +size 208731490 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_20_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_20_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a4b338305e038e4f380adfa9086b56f2d34cea86 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_20_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e630473b2860e27ab97ac07972ec8afaffd526580746bb08385e2756d60e7df7 +size 208732322 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_20_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_20_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..841ad4209b2bdd5479d63da41cd7fa42d5c77e3d --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_20_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:922a2e676fb6d7422603f29235bb603570a096280625b1255deb6bb7abfdf7ed +size 208732322 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..12d1c3e730bde8ac66672fb42551cfc74ab8a767 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b7ef5f37431c897d61875574e30c9438d33f4f9635f3f102a3ba5d703a961fe9 +size 208731426 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..57b29c21c8237acd6eacd0025b4ac492f785f95e --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b1196278171c63b5d70b7a8f59053c4f8e081f08f33dc5ca8548eb74f995c2f +size 208731426 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_21_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_21_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e432b5384360d1c043a7492353287179606bc247 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_21_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:225a5d2d88a59790a1483f0ee204184eefaad3848d79a6032dad35219524f5eb +size 208732130 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_21_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_21_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0757c877850f6455d42c381f909cbe33a7ff1750 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_21_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:892a0d3a2d4c87952283855f99caeee58b1eced97ff117ce0f04c7b832696bc3 +size 208732130 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..30fbb765888f7e4423c862655f4ed02507b77c78 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0a16ef1588b4ccb71a9a39923c6c2e91e9b5b66cceb61999029f6d15ef4520a +size 208731362 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..45aebbeb407ccf8a45ce6c2922428da372bb0b39 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec190cb9cb5b0372bcd1e959021ccc9813fb3e76a9b165f3ec23e2530ef424f8 +size 208731362 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_22_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_22_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dcd3a1ac95b76949a686298f4218bdf97d7375ee --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_22_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e0ff4344e2fdd925d5e303b7d178743d24ad78bc3499b916fac0aef80b47d183 +size 208732130 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_22_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_22_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..95d0e23ed1f7ce0ee1b557d07e1a0d85bfb0690b --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_22_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e63fb9700b3edfbdb2b97787527994017f460e468f5207d494cd88ef571710bd +size 208732130 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cf162d7484b32919998b1b09f068264198cc7885 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76f7c85e166b45ddb716385ccbf3afe6c540137e1c70648a1fbc316d8331f92f +size 208731490 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..05b880b3cda72b1566466cbc1448404219db791d --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:07721a2733afe7c86dc0aaf57119bbd1bb60ce1f03fa716a29c84bb11213f542 +size 208731490 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_23_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_23_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..944989d589c9166b3507ff5d00171b442964e25d --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_23_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d63e31227902bd59391cdfc9d59df2917266f01c130bceb982d499127363bce +size 208732258 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_23_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_23_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b2e8e0b6b8b85a424450cedfb22024cb1d708c16 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_23_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:320cc49e8ebcc1a27cdb26e7ddb9ab30ab0b5142a6654cf68a9f12e0c794d118 +size 208732258 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5c303e3b076ef9f62c73be8df7eceeccee046431 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64f4841725ecc1adeb4a559e46e05ff9f1c3ec0dfab44259599dc844b42694b3 +size 208731426 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ccb97e57e7da64e8c661b335a320cf1cbc250f71 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35ba7f515d3dd77b3f9de3e01e00cd57fa0f6f9fbf96596c68f10d29a949d175 +size 208731426 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_24_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_24_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..92726d82a6f9496c4c10ea28ffca6a8a3061f02f --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_24_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:995a0bf6e000df567f4c02b1b97378878104077d4445d0d0e5ccfe1346712678 +size 208732194 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_24_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_24_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3900dbc69095d283624a9f636d8d75a40ae429de --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_24_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a1368e8fd6522e6f4ab8df896e0ca3f7065b554a7c28055ffa7aa2b8977e1c79 +size 208732194 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9fb982e1f5fcebdc5a0e8f65a77a1283882989b5 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:674a3e64b20c76f65b5e46577e4afb8252ed379db13d3a074bfeaa6774555171 +size 208731426 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2755167da0f71bac0d342e42783f7eed10c11d78 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e273233196bd5c6c1e535be87d587d0185cded1d53dd833b1d58815fd6adeb1 +size 208731426 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_25_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_25_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3e1593dfd3c616349b71b7755bac634c9622daad --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_25_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:54886703c06f143c02f077813220d2796e0d42f3cc5bb047429a7b07e774a863 +size 208732130 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_25_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_25_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fae575d86826c47fc3fc37392346746c6de13f5d --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_25_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8abb146083ed5cc212533c5f1515108eeb33eb970934b0b946dbfc523ed77cc4 +size 208732130 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bacb6526ce0e495c18f467e74247c6a00e73e6f0 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:16b97be5a3ca4578170861d2b05ecc873d8f3661c92f8dff062a776cbaedf6ef +size 208731426 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2af56bb4369c0f8da91fef36e1984a442be0f7d0 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d1b9634e9b25e95259168c332db9e3114414427af177abfc50aabed740b2da25 +size 208731426 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_26_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_26_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b95eb14ae0a24c6d41fef623426a8cf243dbc8cd --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_26_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:44e09c9576781e4066f4d75a9ec4f2fc7a9de73bd0a29d3329c33aee3d884061 +size 208732258 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_26_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_26_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e36689e3677f0e1d218505913e7df9d8e4edc0be --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_26_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cdcd47d8efe0974afa127a483156062769831386b0f521c76e470763c81ae48e +size 208732258 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c775a4b26528933cdcefbc0e585112a159481ef1 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e31f6caedfd491ba53a4db8d8d0a705efde304c181669d7e108a24d62ee7649 +size 208731490 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..531ae57ef78b60d8fdd1d9ead705a0e20a15b57b --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e94d01ae7b46b4128048044292b58f6292c0a62fb39b693ae21c9d8cc0d93252 +size 208731490 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_27_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_27_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..edfc47af108aaf051aa9ac4e15348739b1407e30 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_27_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:70c6199fc1f735b2d2dd9fc4658e37c8f63ffb623d637722ca46e416fba50809 +size 208732194 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_27_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_27_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8610b8b91dd6e0ac23d1fcda6ebd31521249710e --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_27_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dec5dafdb94df7f2a7433bea295dabfcecebf5c98e9bd6e4c33d23d3c55fd004 +size 208732194 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ea2eb70314bd87a1ca85fb2cdcdf3d8f2b9519f0 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c91f7781a5f4f3a7df6eda72db984c7f413f97c566c0ac7c8174c3cb8d55792 +size 208731362 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8497cff729c93740ccd616c87e3e1bee31eef081 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c070ba7057b17f8e17b7b8058e9ba98d04c30fd7c0fb831e16651208dd961755 +size 208731362 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_28_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_28_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a2453958855050b899939844f4f4a0f7264fdb1b --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_28_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae27ef3ae66ede42f36b583f07b66bcab6ba87e626448f7d340de79a23f0ce30 +size 208732194 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_28_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_28_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9b321d5aacf88ea9efcf3553678fd82ab7e190cd --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_28_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f2e5600fecee9c7e7603c96d863e316dc8949ad1c4a6ff29d1f88bc89cd6b997 +size 208732194 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ca67f17ee2ffb37354a523c55af2885aa124f6e2 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6cadc7127284a47cf9f1033d598de6adafb597caa13a822327fa3388e054fd0e +size 208731298 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..32daf58bdbbdd7fcc15ca70cd341c49123f66f31 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cba5e0f6c7d5c6bcc91a5533dad9e5744d633d8a499e38e63e2e46da6dddb27d +size 208731298 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_29_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_29_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ef5f2680e9f1bbb7cb1a78d7dbb624f4a38295bd --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_29_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:41666f21b289d1e6bd8a12b1deb0a7d276d5fa200b0b119a20192b09b71ace68 +size 208732066 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_29_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_29_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d6ae016a52ea61d7163e9f8ac060b88da4007f45 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_29_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be30a12550bc35786b394319ffe3934e497a4b6066af21567c17e387051373c5 +size 208732066 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dac81cec94ccc4180272accbe8ab9990bd2c45bf --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:57278c00f8b7d5040bc7a5aa04ae24e279237ef68348158597185f24a0c6784c +size 208731415 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..da7b93f18f0c4f3f1157d66edae424ad414a4346 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2232473306e780e7918230307c8baf1eb3a4e3af2390293409200cf2a1958c53 +size 208731415 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_2_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_2_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f29540d032ab7692cf172bfc810f49a8b81d37ba --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_2_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:293868fa896c996a6e9b24c794079c8d8faec0bbfee44afe2d240cd013a8379b +size 208732183 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_2_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_2_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..018c52467eb5599ca8445b24ca21c019c0c7d0a7 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_2_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc8212cd2f540dee5486a9b9f64d47b48187a241f42718fea827c218cb3f525b +size 208732183 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..aa0a3ffbe5239d8a57b897a78af940c85fcf939b --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5bc03d19799f71ee51552c8a3156a0f8bf5f95ea63566d41f84314beb319edf7 +size 208731298 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ca58dce6759baefb70f6ccfaedfc50341bdb3a54 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:708c9858bd32d24e76c4b8f74fe1dfd4ebae855cc09c5d98d52e51b35258e69d +size 208731298 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_30_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_30_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..374e51ce595a0d0e0d0d5e08912f9ad7146ea877 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_30_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fdde8880f491c387e46d3c41c58bac2fce5930424bd69a852c8bfa26d433e28a +size 208732130 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_30_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_30_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..51a64f120ea5090c920e66fde38895b6975552cd --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_30_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e79f72e25dcbef13ca7b62a4c1341633acad51d55983d579cd3978f020a8453 +size 208732130 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..34da4997a238627853836ff2ff1fd0a42857e841 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dca95ab71aaed7dca598231926637303b071756cd4ed2d326cde34a34b2c6ded +size 208731426 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ae6f1d57afb158b446f8adfa26f2762a2d3b3e4d --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b6632dd76bab526702065ed22bf62c8bcfb2c9672b3dedc78b13abe32353b6c +size 208731426 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_31_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_31_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..22793b61bc7c48131b3cf806d38443864a5da795 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_31_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec9b9f0127191c0541e36611c6a0f4b1953f727349da5be7d8b7198980d81890 +size 208732194 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_31_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_31_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..28ee9114fd0c71a4887107312a40632fa8273e06 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_31_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c19038de5b30302d1b3dafc0fb245a60ad0ee774af93b23b8ac4cf6b3a53ebf +size 208732194 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a47a52b1284d58697cbf5fec57a9391ce894716e --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1aee55e34ae6331b172ae596e5e4b79857801ff805691a80141a7a5bd367121 +size 208731426 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..82bfe60e5e5467f490385f37cf26a182cf29789d --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a4c113e2518de68ab0d790bf90cfa8c937f1d1bc9f1a2cc6494581b50196a4c2 +size 208731426 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_32_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_32_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ef96b55835028ad83fbfaa73575988de6cb05400 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_32_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4413557fb51dda496ba9746829912b2b65291f75bb97c08f3d4855659dd932c +size 208732194 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_32_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_32_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6f0b4220008f7df91a2fa47f3f8873624963fb1f --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_32_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0a66e9b17b83dc257a449edc830d14c2268269cdd009318989f44d89a6a0755 +size 208732194 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..31019f7e0c4087a57fd81d133cc3ed5c112639e3 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:33991cba82db68f7a8d4487d4e4dbc0702cffeae8fe751a862e625370d2a68d5 +size 208731362 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bd65a894aa42aa9c2cc2c83c44d5e2323725f350 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b5f1f185e8b2de10da763053e7624658917eebda0fadf65a6449c03f1b955042 +size 208731362 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_33_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_33_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..45ba5e6994d7114f81983ba2b0ff9886858d4a77 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_33_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5597744192a812308a4d7a2dc869bd1cc4659877c8eee71086a9f30cc1404271 +size 208732194 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_33_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_33_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b93c0975da19bf79b8247fa66b76bad8ebb9e482 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_33_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:822ed4f5700b88c7790f2c0338d377cd0ab7d221996aa4d857864c60180599f8 +size 208732194 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a7bacb6679fa8d1ffa0448a01d11cd491ccb2a73 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a0599591bea9e3e63b7ee82d192a397b130b6cfd3a1eb4c17547d5d0736c8c6 +size 208731426 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c09b965542d8b287a59153afbed56648ea52e445 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0826bb23e3ebcd4ce4d39eb82431e7665f43db8a379743d76a9b0db8fccc0506 +size 208731426 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_34_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_34_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d05998bfb86c4bae498a1b147cabe68fa8b265d9 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_34_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2cf0732a2d5e48085b4127b09ab3dd76e68aa60ba5f6c4128fede8dbca338dba +size 208732130 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_34_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_34_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d6e2cd854d9bd7fc2b3939a947adb8a9beaca61e --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_34_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e9b68636e7b71655f0e633666dd1a02f5e6a73f7590c3028dd8fa11047c3146 +size 208732130 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a7ff73e068dc0c95cfe5e5b843dd4b30a3a54431 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef2f1f3ab21112530cc578f9d2f54bd7d049212cbddfd9bafa78429c47c81b09 +size 208731490 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..58fe82447489d0c75ce38ad706768176d465b694 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b95d27218057989d65ce434f73a3ff49c259a2ee649d334ca252a387bb0c7fb2 +size 208731490 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_35_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_35_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4b8b15e3807a8923cc3f82e78769936e57dec98f --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_35_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8e8d81b3f8ce0eceb423af85610e794f52b2fd45341d0157ba9e4473ed5a42a +size 208732258 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_35_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_35_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a294443613ee6da00b0cbc3cd2d8a756313537a7 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_35_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de9bd8e9e877ba9d76b34959801aad67ccf765fd7ec419f4c7f495cd3033dc31 +size 208732258 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e1d268932f12c37fc182dad79bec28d7ff1dd8b0 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39d59be932f7c1ea9c87fe770f58722565dfd262570fe5c739b05d63f548df55 +size 208731426 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d3c696407211a5d0b8945ce1f25d2e8e5df59c41 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d73365f91b3273762104de87de56fef64f2196cf92c3c4438457c460f536928e +size 208731426 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_36_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_36_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6091467d761aa6ecac52634e707e28cb53883ae9 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_36_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c1bfde6721aaf83d4334acda5e680dd11eb91d17c4a6fa3b66773c0674fc329 +size 208732194 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_36_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_36_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..21b856e1440b675bdf31774fe4b8178bdd16f481 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_36_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5c594cd3b4408a313e9e07a8940b3891316d65e781b8c9c85e268b6d912aa4b +size 208732194 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ef31301942ff6587373c77c431f889cc83178673 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:744a41d5c6844f84f26c96819fece4dfe5bbdc0d148355b57ed7c6f0d432b395 +size 208731490 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..419b7fba0363fa8a619cec7ab9f6e7607a206658 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06d46bf0d54340f922156e1d76f5790fbecef66caf47dfd00c5db86be3b3903f +size 208731490 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_37_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_37_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..50785b1d52a13076cd786325ae1a6f491a8fe324 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_37_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:44c864d167d922ffadaa48276f57a6507c39f21817f6c31fc6919e708df90564 +size 208732194 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_37_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_37_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2d66360ef96d5b2e02e3626ac9ec7741a67a5b55 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_37_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aaa8be7b5f3df2f3d89a0f6ad9951ec106f9e6150048e2bf1d4af32236a8c625 +size 208732194 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..93ed85bdf3764d68cf1ea789ee6b004997e613b0 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:01a8b7e547cf9197d3b82f9304e792cd533afd69b5b78d0ea41ecbb934c41616 +size 208731426 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..67a315cef8e884ed86352aa9240abdac074335f9 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b0b9e5723766dea826ee2b86064ec7d919f25e6ff19e2298bae59d674193408b +size 208731426 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_38_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_38_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9fc3b2339ef5440c50f36fcd8f44c3c8c070afed --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_38_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:928f86556f3c13830d44ce23199e72fe3f215fec83ac41ebfdab8cdbeddc8b9d +size 208732194 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_38_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_38_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2597a388f990e4bcc5b4f694f14efe744a47c266 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_38_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b117c9f11a1854c0e7654a37ca53c78cd0acb9eb1ae0995c325180ce289abeb2 +size 208732194 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9d47134e6b6122848653196c854863e48d578495 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9d89f9955b39d6c34d8c1295219d3653e9a1cf18b72ab3cc21626ef31fc45ad +size 208731362 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a4a01439b4e3cfeeffc63ca3e6e7501bcbf478b9 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:344370f433e6c9449b8e8c306e4aa5a889d57098897b2911c752a03f947eca0a +size 208731362 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_39_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_39_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..26d635b694650b01bbb8bf327965ab442eecf63a --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_39_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d1c7ffb02bfb85a92f347f1ba3ff6b861c44235bd2c3cd9055124ba61bcf1b3f +size 208732194 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_39_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_39_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..425929966d07a03305a90687b24c816dc1365ea6 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_39_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c784b35a45de1050fc0dd687ee93e6c11e12b60d4a2816117bb874968a4b6c11 +size 208732194 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5b03895f20000fedf584a5c50a31eabcee3c675c --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b560b6b698ed9d8e58cefcd7d85fad6e4d4d1a3216b7672c6f37e865e6e71755 +size 208731351 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f0755ed3ddd19c9175033aae2fb3495c5b99bebd --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f4c8334094e96da4f33d9c24496cc35dc29d6f47b0910ab24e1fa6a1b372ebd +size 208731351 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_3_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_3_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f47bbfab60e19f3a0a77bfa102c98c9d03452192 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_3_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0635ed5aa1c78ea9f42ba1360833693ae1ccaacee70292be25047bf1f29df745 +size 208732119 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_3_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_3_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2ab1f73985c0f1629a0d04d909a6aaa43c2daaad --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_3_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f2622f27e0b5b2659719388acd513d92afcb1328ca0a9890b49c2f7a0218ee4e +size 208732119 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9c2e7c51de88431ec6e914cd9d099377405d3499 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:096e4d850895aefb4dd1238bf15a9dbbbcc048e9c206327ede5083ae44e3bd2c +size 208731426 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..248f93783d1fd33ab01192d8ee21bbed5624fda8 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a659899400bdabf81d501883f119f49f62a6bfb62c4c8240762d9967f8628eac +size 208731426 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_40_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_40_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0f35a98867c513ea3349843cad3b7cfca9c9918d --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_40_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:21a6f697bb9ac3871dd9b5e80c3e106335d178c3b6ef66f14376bd4dd4d89a0b +size 208732194 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_40_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_40_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1f7784d162015365aaf5d1b498e7c813394eb6ab --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_40_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6a6ad346c5a05952b2a13e384f28aa8a131875f3a154a3b912e0017641808e5e +size 208732194 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..442f69301314842b2466cf5ddb1974e28219f5b3 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d34edd449c8c74f219c8fb580eb885584609214127e40b2461a9b6fa9ed4b6f +size 208731298 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c34b36c55fa086778d71b1621ff5cc9bbd4d393b --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0456453a38075e32b262f65ebdeb20b0a878a3431b3811b061e96035a682a36f +size 208731298 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_41_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_41_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0d9f0682e91238e889971b834e43778b4256982f --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_41_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bec7acd7baccca25c0b8fbe71d8ee8b4c689145c08afdf715ca09d73230e9490 +size 208732066 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_41_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_41_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bc2f237b9ade58244ce677c54c465c4717e64772 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_41_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8421aaa1b719dc172927727de75db54c242a0452f8830c11f478b65f6b21708 +size 208732066 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9758ec604abb5f6ac2a30d46e2ac1e87cb7ccd44 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:50c7f3080fc9f34beacdd581f07279c85e809508e085fb2f0c98fce9c7f9d8a6 +size 208731426 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..370954fd552d016b1681b14629464e8a32f1e0e9 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27294cd92fad4c20e5cc30fbaa747ba3b8efecac686472a1cb06f989440d092f +size 208731426 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_42_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_42_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..891d1a34666d9e530cd15311cc7622ff3374d5b7 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_42_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f9994e457f20185ee92b43372e1a00b8c9445acc4824532e18bf43c095da2d13 +size 208732194 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_42_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_42_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..48aa0188aec1918165dde82cff113501d59e7d5b --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_42_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:951ac366efdca33b902b4d20a217c44934104bd887603597fafbc091f6220fc9 +size 208732194 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..db9acca179d19ef5bdfcd2427b97672378af11ec --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2df519126c4c1d5dc610835cdbfa144d1c38d1df17d9f3d2109897f75009d541 +size 208731362 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..da181f121dc143854260c707acf16fa7daef2610 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d83879c81a3682766819e9000307ed9645586caf61e2891ef6351a41d55f7e8 +size 208731362 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_43_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_43_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8a2f1e83a90288375559b95e42c6af2be3936806 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_43_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39cceae928587faccac39f970abe71f0c19a40b92f8212dfd4166e15ee99dca5 +size 208732130 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_43_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_43_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..09aa4351a08b9191593235f6762060b89e9dd42a --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_43_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a7f12846a245fd8365eac5d698947a5601869cf0e0c9faf84d8d9aafcfe013a +size 208732130 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ae40cb799dc1b4f31c9f8d1f92a510d080bcdb36 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b85e04743f678f2f007a24b6ccf39d09b8209abab632b9b9978614e2dc1bb500 +size 208731426 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..48cb1beceffb424f4b91f127b449ee865ceb9352 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:000d9dcbb1de39d6a61420b2f3c3fb8c822a034648c5376d32e9fed657704aa0 +size 208731426 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_44_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_44_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..90cd738f520674be697cfb60229b0ed7918f3b8e --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_44_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76546dffe3bf2a302833a7639e146b061efeaf5dbc142a04debde42a6f685a2c +size 208732194 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_44_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_44_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..beb6d0d836061b9361fe5f8b715133f69bb8aa79 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_44_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:289014d387b48eb27e88a923b16d97e0f158f578964b8682d5495873b5f4cc61 +size 208732194 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bdbc4c4669869a060acb5b73a8aa8f844e3e9a45 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ba9c60824d768b7a69c47167790991a88b6f63246f5bc50a71776a067a253da +size 208731362 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..af5f02050f0afe27653d210028ab86f5dd4ce680 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d4ce134a9eb6fee8d76b8fb7f9c1b50a254ee5ff8e407d2b960ee80196d5be8 +size 208731362 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_45_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_45_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f9615ea87eef5aef360c8bbb7318cdc674e5983b --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_45_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:decb7b40cbd21ca5ea1cf33b27e0d989fa4eb93e952c10ea81e7eeb4cffb3f1e +size 208732194 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_45_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_45_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..776d937a0e2e614f4eb6427ce8951043b763b1a6 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_45_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7710950a082059d67ba017419bbb6ad6d78e1473d086c1da4f37dfa84c0867e5 +size 208732194 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e1146a4b82c7cc09a2842d31d46c06440703cb58 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c45def6c01f492b80a6debdd0993501e6c83eee3c768274fb8d1de1466e2365 +size 208731490 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..57d6a329ff44bdd283035a11c52958e0c0585111 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d2d7877c609e017f03ed92e8662f9f2721b2d7e0f233ec04a82a5860135ac6e5 +size 208731490 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_46_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_46_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..94155baed06083afdcce2caa610b6e541626b338 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_46_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a6d553ac4eec9d5de698bdd89daa26b4626b8ad03b69a687534c50ea0da973e +size 208732194 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_46_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_46_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..65285fde03e6bc08875577c63331e9152448150b --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_46_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a0cedf91e243d8043d42729fd12d32bbd8c93553cb7fed7a8e56f4d274bb9340 +size 208732194 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d568c301174d82aa824d09a105172e4ea4f53cb1 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:620504cba4ac6ad7e3df26ff3f631cd5df2b124c9150e0752eed4670908d0ce8 +size 208731362 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..30d011cd526d3322f8ab4ecd3f27574fa5973635 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02b5246c61826497cc2ee977f28fc724f4bf6314c552312156fc6b8ebcc6bd8f +size 208731362 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_47_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_47_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c064c07b808a52a437aaf80a6f635207835f2221 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_47_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d2189733762120cbe0f6a9277431ad621c44eb5e9f90fced2b801d2097cabb44 +size 208732194 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_47_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_47_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fe1a6f927bedd6d61a7b88fbf96598923de2da12 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_47_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74ac210c395b9360a010f98203adc41e85ce02161f8f67a8682220ece44a6577 +size 208732194 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4229ad1661d67de6db076163e3f5dff110a6286d --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:95929079424a00aaf41b64e6b89c3a02a91c53c75ec8ff9476866f51258fba5c +size 208731426 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2a05d07f1896f56f946f628092d13c505a3585b4 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1b8c102c227c97791e23381e6d32767591aa4cd94ebb15292f513f9dc4b2729 +size 208731426 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_48_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_48_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0664aa18660107c4d6135c34293c1999c852d822 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_48_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7fec645c50c314c64a5a969056b2ed33e568484eb9f285b41004404cc65345e0 +size 208732194 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_48_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_48_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b915937ee224c6958f94789953331d2ca3222a41 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_48_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c63b072535a0b450c5f9d696590e156cedeaea7e05a7f96e4b5182b8fc2daddf +size 208732194 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..55a26684fced770ee7e3d2ee4b80db9bb1560c1d --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20d78f8353fb6c72bf88b66102ee606e4fd22c8c45c44916a3b5fd752584734b +size 208731426 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b486e1c48fc273075ff89d468412641f4c1c8f18 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:373023ac3dcc0f087bca9c8beab1f3bcf90982e940afc22992320b617db3a36f +size 208731426 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_49_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_49_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..21f2fd83be31bc24b4d5b0580eed02b4ff451940 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_49_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:640f406feed3e8c7b945f6061849444a222622d008256f696e3d9a13226b3dd3 +size 208732194 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_49_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_49_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6bf2c1aad2df9a9f71f0f3034df99fb9532ed5f6 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_49_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ae440b19c4a022924629a1a84b7617b03f999818f9a22c8e9397526c09dc2bd +size 208732194 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..744e7101a17fdf37c7cd547275985dc136189c31 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:274175edb8e2cf0ef9c044c2504755816fe4cf6301542be0b6da5e5166e0a937 +size 208731415 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..73f271e820f926fe0e5590069cd3df743d4f5d0f --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aad4099273be75960fbd610d795c4b93abed9c00f591af6921650d965fd89566 +size 208731415 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_4_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_4_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3abe234e3dcd1f791c8a803f9cc668e2ce3d90de --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_4_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:93f645d9fb66a873070c60dede9fba8b6c5035e2001aea08ffb427aa7fdc380e +size 208732183 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_4_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_4_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2f18d5ae741a97bc14ea72714e329eeb0f153374 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_4_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b3cf2de51b7612ab4ceeadc4df2677ab9d9c019695a35b9bb8dc025b50db8d77 +size 208732183 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3710e8e5fa5a2739a4ccad3444ed5483c20d58b1 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b7e12e5f21f4530d99a512ff2cdcd8c480fd7649e47142ac5d9dbb259d18e896 +size 208731426 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6aabfb6cb361237635f78b026a978e585d2a3449 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:47cd7f8e9df04057311e6f7a06e7d96cc4b4c1fb2502dcde37a9d29c31c99df2 +size 208731426 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_50_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_50_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..02a63a16204652aeadfc62172e71db0be338253d --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_50_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:57cf97438dc72e031a0783d2235f8f00d01a36ae17618b092122c53965e70e99 +size 208732194 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_50_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_50_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fc83c3665166201d127e2dae6eb13a3d69d9649e --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_50_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02b271fa9cadb8df7e9cb5a6822c1fd529371b420c750c03a9de146d35ea1436 +size 208732194 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..df5f1ee5bca991df5adc2f84f06138e7c5795281 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:769a5a4059849e9a7ef7377ad330c297dcda50e1c0d4d455dd65fb75b71fbda5 +size 208731426 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..617ee0aee99c7b7ae456c14554573b1924cac0b3 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf2d49f021c29a415dbf3af284b0113bf46d1dccb80450b506076b03e2adc4d8 +size 208731426 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_51_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_51_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8cc3eb1508188188e100d98b3bcf76cbaffca735 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_51_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:782ab493cd297a15064f76b0d77c40ed6eb04be9c7a02ed9df22fe82c275ff7a +size 208732194 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_51_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_51_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5f57f5ab07101b3d378c58ae814ec1a77ef20565 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_51_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:03f0f9211d37f0782243549ab3e83f52f32da62367fe32cf2484099f36f55481 +size 208732194 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a3b36d711b3819b7b6c5a6563a5c07582da0b8bb --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a25ca21c6312bcda079c6e0b0d6a5cc8bab4af6e4df975d8901fb70e6343cdd +size 208731426 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2593496e1aed2648428fca75460b7c293691497e --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e6a91ce325de566ceeaee4c335007316954b0c53654082e6f07e41ed16540e8 +size 208731426 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_52_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_52_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b36657ba1b324596736d46ff1615abd98b6c2141 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_52_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7969a041b73598f0c74476ccec6c788e6e3fc1c37203b13d6680280e136c2e26 +size 208732194 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_52_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_52_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..511b90fef1e379cd2b0fa2339daad2659c15758a --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_52_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cfbca7da76f2edf92ee95bfd196966dcfa1bf44015a456527bbea3ccc1b145d0 +size 208732194 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..16d6bfd17e3c779b5bae56ddc695a789069267c1 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a1ecbc7c9d84a1f93b88b0b8124947318db6695f0e58fba85ccce078925e902 +size 208731362 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d31911d8e00e03c1e12d585dbe5d764ab74c5a9c --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:916ad3c0da9f2f980715b67484ef384047f761f1f75eb6075ad618edf942e84e +size 208731362 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_53_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_53_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..08be4e643259c4f786c1f49a592367d8389a2301 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_53_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:26daa6c88df03e1e66003bc5f20428e6e5209ad016fed94b1712f5247f89285e +size 208732130 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_53_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_53_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..74ce7c27f64a584b0b90c00d669815337118acd4 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_53_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3995b37990cfff2448279384592968600f3309508cd4adf78275ff3d1342f40a +size 208732130 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..286169c0155dc73b1e6ece1777e9b4c9105fdc5c --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f8e061959d8bd7b1e324ca5f63c6b939b75104dd101ee910ccbf73ebceb715a8 +size 208731362 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cd8443111ea4a3de0a61dab621a9b4f251df5ab4 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84d32927ca88ecd4eefe9e7cdabafae30faca335a2509d44323d781476ccf530 +size 208731362 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_54_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_54_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..09271ba51c56d60dd6fae70082ea2afc3f62cfeb --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_54_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6f54c89baf2234f22d0412f1e7ee77dc72c4507ac9c5ea3a5ad540b81830d0a +size 208732130 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_54_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_54_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..94313c2833c79be15fb2dce4a623330091e421c1 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_54_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:917eb915ad357779a89a2edc4dcc9450ab91bcc4b70a850aa684051b7efa9d9d +size 208732130 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..df6ed6418f8d26ae64869b8a0ca7acbfffeb3e83 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e9ec67a69f742b788029408347910575c5b6868786663a8cdbec3d32edbb48f8 +size 208731298 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3a31345a35936641ab1f70ad2c3a279af0ffd910 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5629bb6697e10922ad992cb590423f2c0ba2ebdbd0770c9fa8db2bdb2d1bf3dc +size 208731298 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_55_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_55_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..58710eac96357af666279010da1be0a39a616214 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_55_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1db6982f12f571c037bb8645a857befeb19706741893bc8afee6878814f1d85f +size 208732130 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_55_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_55_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..aa76663ab8763d405e770815e0aa204be29e6a1a --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_55_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:784ca32b3a0a9cb92f4b3a05baafab95c34c894549a68717eea367e68fde719a +size 208732130 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6d29223daf4a80de7885c9d61120cfaa79b25abf --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:42fcefc3f1b7059043addbbff7feb9249bca4a6ad38648447609fe9848eabf30 +size 208731426 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..91ec52ad633b549d0c51f4c63c30acd903598f58 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5acf6bec7acafee5df8b2a006c9e513a54cd494ee481910336ff86f58643d006 +size 208731426 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_56_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_56_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d4269225d2d80c780294b0692864cd5f59ec8a7b --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_56_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d1a899405d269b6dc17ea7068bc3312cc3b311ab907a386f75d543fd4ef9511 +size 208732194 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_56_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_56_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8aed205680a5338825273e5b0706b270210863d4 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_56_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4fd0bc706d9fbd1976b741f47cf274a4c0dd05c39287efb6335b7a3ef680b7ea +size 208732194 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2de6f77936eba47e35c5fc8141478ea76eed64f6 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed03fed98423e2cecc710ecb53f71d33976ff287854ad5cc05d17c3d80727b3d +size 208731490 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7476f0c7893cee3528d06aa8672c054b480d9b4d --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6013d4dbfb9c3c1db0d1296e9157da63606e568ce527e9b46f19fc0d3ee9e6b5 +size 208731490 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_57_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_57_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2f8e14ffb80b587be413e615b3152a83d024efaa --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_57_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:196d9fe5d52dc83f6c2e3dfcb265a625eab6eebff1a399b9279c86b91ada8198 +size 208732258 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_57_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_57_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bc40e902447166e326d5b1294474e2aec3d97cd3 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_57_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ff5976585e2313f77224d57d53412414ba6673968cfeb44d0e7416b6bd7d24f +size 208732258 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8ed6331bc7ee7c91569b095ae97015928073ac3f --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b15b6f8d081e5ea0ec6425e6b6e6a0839b40e87d1c2aa91889d79ba010b5ea60 +size 208731362 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a2b0324b7f631c9a52b0f4100dc2a119ef7e7461 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c13c7faf1c4992880a9e8f1d86e93bcfe4d592a78af338a9d1af9092ea76fcad +size 208731362 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_58_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_58_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7fa95ef0c7b23bf4d37aa597ebdb79f6866f1cdf --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_58_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27beea80016b50176b5219ec190d689b021cf9edca5f1168cdcf204cda195f65 +size 208732130 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_58_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_58_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..98b5c36a2104dcf53a9914a911eadec3a7014c9e --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_58_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7426370c9ad1c1c22208703001667d8d0f681a5e767a4abce8c46ce30a55e4c1 +size 208732130 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9aac672986369338b6dbbf09e7e038e3ecfd3c82 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b858bc6cdafc3b1213d25891a11dc2ffdb6ccc545823c89da3004e9214243202 +size 208731426 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5c33edb246526eaa2c07baeb01770fd07645ef6f --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4bd48d28530417cd2c17d547b8f00c8e1705c0d4b9add03238e2f87b445ad24f +size 208731426 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_59_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_59_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..29404a183820f6c979e3e3f8571ab44735ccb3d8 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_59_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d438aa00d558c481128d280a4e8d0d783a4257c624b3d2eab6d620568b405320 +size 208732194 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_59_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_59_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c2fa3182752cbeb4e6f420650752eb1b752e26f1 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_59_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:769bcecb21cb1d2491a3e4f99841be539eaef7bb99b0090bc16f6b38ef1eedd9 +size 208732194 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e9119d72c9f972fe6d571ce41e4d11ba3f57c4e5 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e1aa4e9e23de872d54d4060bb2e6416f69a551007c384cdef51f117de6f4b12 +size 208731351 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8eb8220bc8321278cd87ab654a242fafdd4bef4f --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:79aeac29f9ce0f2c33d88787a7d7513f1afcaf52ce6f2065d124dca6ac5ca19c +size 208731351 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_5_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_5_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4853e0204d5693e1a232092cd5b7286208e19469 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_5_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f3522c56223f57b9232ef68d74b47a1b330382e4cf07b3d503289b60e9d63b5d +size 208732119 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_5_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_5_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0291c24a8f21295c61e38e25c14f8ec336fccff4 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_5_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4022e08beb455a832fef2226c7de38c511a9423e1d3699999afa88233934d6ed +size 208732119 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..baeebb631d3ab18b3e7e55583b58f56276cfed26 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0717c7a7afa3e8ce517961da6745871333ba16b0b525908ce3cc7347732891d1 +size 208731490 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b7704f21a28ac9c8e4f39049cebcf7454ba38515 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:953816bcd6fe0856a98e6cc47f367455e58ae1a6bdf7ac5c46934dc49d9eaca5 +size 208731490 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_60_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_60_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c624ac4471633ed8a42839318f4eef3d1bcf14a8 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_60_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4016be589d55a3589779e09d639dacc860b7b73dc30447db8efcda83ac28ddd7 +size 208732258 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_60_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_60_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f2e5721951f5fc5729f0ed21eb8d5e19481756a5 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_60_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d625b5932d660bebaa97a29b5a923fcc9253e192544471113857fbe5a8daea1 +size 208732258 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2ed025a8b9e4cbb666cb64c80ae83e0c66126cd0 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:859f65d93c88e8a16637364993af07934ea23c400b8efde6405d20c99f1f8e23 +size 208731362 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4e7121d9db8efc7bd3346b9380a6b90cda96f64a --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c064c0b2a0ad7a4ce5f4b08e894abf43b9b6196db0bd2f686e4bb372dffe2700 +size 208731362 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_61_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_61_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b9c529fdf2fe8451314eea0fdd1f452315dd3dd9 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_61_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f048b01a41d825bd12fd26b42d417c6ee6fe176ae3f26e1061940c12e381859 +size 208732194 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_61_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_61_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..32483b38fa807320b7f7b837e487358d64953d8f --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_61_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:55a35cf29e2a1962393d01a872df6315051b9b1e9a018bbf9f0445085497aab5 +size 208732194 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e9986176b26793b31885d08eb04b6e4a88dfc001 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6dd204c5947e56546da007f6a3f50e6c0f1b5c405e353d95d7969d80e06c512b +size 208731362 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..243631966eefd316ff86bcadccfe1ba04aca9e96 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:03a2d4fae328cabf24581ab4482f8e81cf65755893f8515be96c64fc95cb2ba1 +size 208731362 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_62_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_62_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2d4d3bf41789267fa6a1cca01cdfa9f5dade7b6e --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_62_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a51ab44cdbbbf0c6a868b0644b4f81e955bd7adcb4f176b8ae8babab234319bd +size 208732130 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_62_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_62_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e71414ab34de0ab70a27eea9533f6d4cb2a5062f --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_62_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:602f2568bdf1fc3b61d9f95550da352729c6ce49db7e0283b904b05aa86cb2ea +size 208732130 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..466401d31cb7cf9d08f6de304727ed5fb6c992a3 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:695a84b28d9caa2acb7bd1a1773271344d52350fa98a95877f24da24f6e07356 +size 208731426 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c8d6c2699eb5fd7aff02708dfdd7e99d4b7b0321 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:feae03806fb5d71a6ccb44a7c38027274ed090dc96fb31ac3955a33b440e3c87 +size 208731426 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_63_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_63_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ead5e4ff1fbf300e31326542edafdc57a1972fb8 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_63_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6dcf0e9a735724d0c99e87e730b882ee7c17694f9cd41f4b1f8712136b072d1e +size 208732194 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_63_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_63_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..395945ab43bf455364444f9ce16e717f7f4b5910 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_63_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e97ec8a1e104b6667ebbe1065c49764a86c5c8a1cc42849f1e8f474ae982acd4 +size 208732194 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6058d9d11f52a894a8058d4b8f28d94af2b32b01 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db6dee0f1277ccac7313c8ba8beced4172e2f87df2c7c36fd1892641cb237aa8 +size 208731426 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..13ff038fb217e3245c8cb89a1ae15d4713b764b6 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce4dbddf2fa86c70f852bdab7deb7b8c19132a7aedf36b83cb27c92c08597d07 +size 208731426 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_64_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_64_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..52baa01824414562c465971cbbae09af4c5c6e8f --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_64_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b87b94f4c3940777e27b046b01a9ac58d70e272371fa3a96afdc682124655832 +size 208732194 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_64_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_64_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e238ffa00b918c42b05bda0d529291a4fc0c5732 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_64_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef47444256a71a312f608a01e4473e7885168bb96812a01e273f61a1022dab6d +size 208732194 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9a501ca4d5adf5dbb8039721e214a5ff91f5dd83 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e60b4c33f016e8dfebc0934428d1dbad5f50d2ec9ab4238440f052041cfb3f39 +size 208731362 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..33d82c3853f22df7caa03f297ea9e46dbe606788 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e17670827f00af023f02462aace157924bd8e6886946984e44d282dfe0ba7b4 +size 208731362 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_65_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_65_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dbfbd24399ce2b7007ea92c0f2be46c3f63166f1 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_65_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eea8d313bf6300f3b76c3199131b174d12af562dd5aff092efc6aecf036dd923 +size 208732130 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_65_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_65_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..14edb668ab2e85b8c00e05916ece8dadd00107ff --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_65_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a3d6f520de603b779c97bdefde57b32bc9cf0f3d8bdb450f11a5639dc477625b +size 208732130 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e0a7702f872c0ff698e0afcb7cd9796324920525 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:50fea20f9679f507471236de0f00c41d0bd4e1a0cbe320bd18e8d85e8fbb0d13 +size 208731298 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..de9b70225b4690ed6f867d74c3840a5f82444968 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27dc1a59d8a07cf04d5046e9189a607df979f9598fd6fc32e5a8544374864ec0 +size 208731298 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_66_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_66_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..97536d5e1dd23240fa26347d6b3cb5a0c72db202 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_66_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f52813125b635aa5d71f818fd319b217fae33b03367baa33bd8aca6e60d13d7d +size 208732066 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_66_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_66_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1e3a0621d1c9819f02ca81fd0d71375eeb07ac43 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_66_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a81685531b12b9292b8ea6c1f4ba7fa8c1bfa4884d253a5e5cab7eb5befc4b65 +size 208732066 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d3f77f1fe37222d8bf3517412baf4f7a993e0a57 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74115f77fc4a0eaaaf862e838c46b61f1db854f571f08c0ef234eb87a8bfcb7a +size 208731362 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6f4485b115501be392cec95c45b558dd73ffb587 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a66b86b5817b088ae8e9a0f4634b9ef35bc09f9237c941a30fcf515602874f3a +size 208731362 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_67_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_67_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..590fd340f2b069465dcbe63d9fa914a718141730 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_67_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39bdd60c82da6edfe69057a2541704c8968ca08e9ac793b0949c74926d2c0172 +size 208732130 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_67_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_67_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a9b8d164a8442395c560cd53d9962ef273b6294f --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_67_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a47de648ac800e0828d18522b45b77daac3e60592672527b4c1ad58de310d81 +size 208732130 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3f08cf9b32b3d4ac1fece53d98f30fc82ee73f72 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c28ddcd10cfcb7f6135b023fe3933bfa69b58176280d60042eb8546cd6398979 +size 208731490 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0f09507a78b01185ab4367298a394ac5764ef2cd --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:986e34c55e771b8bc999b61f09ec46a4b23904b8c168673469bc3656d765a68d +size 208731490 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_68_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_68_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..80e87340a86558b82ac0f45e8995cae3b8baac87 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_68_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a878de92dc09078d575096fd70a51df85a552a9ca3784beba700f6c921b68177 +size 208732258 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_68_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_68_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8ec32d5de7c085efec1413d2a0e9ef52f64fd9e8 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_68_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a126b892767df9fe529f42416a53cfaf19d41c305acd82c156df4f29de400053 +size 208732258 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..78eb6d1187866f2a84718d8103736bf0b0436d46 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:812609f4bce0478acc2944248c1f03ac450c68f8eee73cab6728d80a785409f6 +size 208731426 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..452ff3a3ec43796c0e35e263280a5e0d8b630c3e --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8038d02327a47ac846e9c272c1c8b07ce4805d4de35b3e3ac3a8839123c9be0 +size 208731426 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_69_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_69_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6ade749ebf11c0979c1102230bc681f155a23113 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_69_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58a5671351df8a7750d802706367daab46d7336b9824eaed289eaa3421140d7e +size 208732194 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_69_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_69_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..08a20a6e61f4924502625de71d3106282915fcc3 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_69_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:746f6c6779a462fa62be2f11fb763e451b6a81309840d1edd497c067f54e4fd7 +size 208732194 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..851c12becf65ada82435d6b8fa9e10f1e3908508 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:458aa0750fe199a161efef4dee782f6351ab644c540e6042461cde36eaae3585 +size 208731351 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3fcee6b4f1afcff6c74a84a14e966cc383b65c27 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f1e51e1d44797fe9046849598b888a0a68f1efceea0a9f88478fb9d828259a30 +size 208731351 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_6_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_6_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..efa33fc065a0bad59c703583061d0f0e6fb46bd0 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_6_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4dd2260a34d7c6652560e46e7dcc8a209bdf8fc5e4ef0b129b178ced47eabe6e +size 208732119 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_6_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_6_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..91b3497c8c8d86ad33bb700018208b0bfe20fa00 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_6_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b719499f3cd8ba0ca82c09fd6249a8b31fc321c276672ae92f61b5dc4125554 +size 208732119 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7eacc12b83f07df8bb1f6b33f4d19678f0f1132d --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e975bebda976a3a2f79841eb820792a0c887ca9173cdc2ed225523a9970a2f4c +size 208731362 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b4ba7c289a6aa72a646ef5e7061133ffd5bc179a --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a80f3a90a8c860220ffa877790b1ff13cba93fc1c51fa240746d18ec8d6bb48d +size 208731362 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_70_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_70_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..96cec48deb68d2de1546f6443faccc39d0a0edde --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_70_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b7e33df6a1c6b09a151b7a37f4ff3da9bfa5036187686c901c040841127f728 +size 208732130 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_70_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_70_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5a1775540c34f77e02f82d24dd75e81ed531f3d1 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_70_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:598ebfd5dc5e464b82071b3dca852d75ab1afd532290b0017fba353343d8fe15 +size 208732130 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..618b1074d67ac93b1c7e5cbb1a25e04d439bc4ed --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:502a6a60372838b5a9cc824e2fe6929fb44e2e7f6677d3feb3c649672734f9c4 +size 208731490 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..71736924298f8d22ce2c1e5c4096fd8c37e280ba --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:021db73a1aa0ecf1c56fcd2e45273aa255208a36da5ebaa196772a1abcfc44dc +size 208731490 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_71_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_71_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..332d301522bb280b0089d8ba6790ae160017f122 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_71_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:96bf391e143badd10a6b007a84f32f4670231a890ade286c7b10dbf7263f20e5 +size 208732258 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_71_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_71_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a635ac1c6817a5dc63e71c363300f9b24500feb5 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_71_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf56cd5c6a4e256979cd2ae5d1742d1652149b9d3cf972a8b82241434e0e1c2c +size 208732258 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cb957d85d426b2d38ec052ff489b01b23490264c --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cef4b714249d895e96a48dd52f03ad62139b5e4a8d1db3e56e07b15ac2a16e1b +size 208731426 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6d126f9085be3c15f96710eda094bb9e9d7cc4fc --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0de3e4eb9821d488491d08ce1fb966ca400994e03fb87aafd03480a0dbf94890 +size 208731426 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_72_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_72_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a52b23165a47c25cc6914ef7ab4d683ed7c7216a --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_72_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0bbe92da269c7fad6e66712bc4bc6bf474007f292d72e11cb76060c6d8326680 +size 208732194 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_72_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_72_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b1ba4b7874b782f1af6c2b0c0e5b35dbfc498253 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_72_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e519b06a3bea820c258d8a545fdaa1c730d9d0a863b98294a83e9864ee4094d +size 208732194 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a607131d16616c9e0492e736d61d8f5625983326 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:91871a3dfde57ad1bf5b3081696a8b4e450858da84931017b3a2e099d98bfd62 +size 208731362 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e9bfcc873be40a1a7f02234962b7051ff97813d5 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6bbe5a9dbfe21e72c9ec50e9fdf2c1a4f228ec20a242c3925d2ed025f2ead8f6 +size 208731362 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_73_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_73_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8714bc6c58cc85ea7c08da3beda8f0f577015bf5 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_73_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e5e50a8acb1f6cd6f18772ee7e665e0ff92877bf4774acc00bce69fafcb040f1 +size 208732130 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_73_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_73_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8f4b1f59dcddf1619446c8daf3805b55691ad4ba --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_73_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:42fc65f1247b0d26f20251e44124f000c5be33a4092c0d8abe8fe77ae45d6365 +size 208732130 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..aa5e2f90aede9c66ee104b24e08e6dfae7452668 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7fe198cff927ec6f9867c29d4dac18a2ffd490e743035293df990b6713442bdf +size 208731362 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ac6196cffe33d69edac4ff283afe29b3203dc921 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0be41f3cff445dd7d839608a56ef94f934ac2c34ead3e65d36d1c459bd9a8b62 +size 208731362 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_74_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_74_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0793f5f0459114c10368c736a4ad0a5a67257a39 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_74_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d2dcb855e0d1ba42927ce78e5f02335aa30067a341ee8e9667e4d864f3ca116 +size 208732130 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_74_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_74_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d8e82c833696e85a0d0dbfb8ddb8617e2d1c7a4d --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_74_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f4e3a8f2e8a53cf2f7bf6662e3103ba30633fcf4d57f3e0a76a9582a527670e1 +size 208732130 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7396d8326875906d9ae65d7ff541acae2ee5808e --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a55f79a1915defb892cf16aa548e0e451d121c5e1191840e3c30fab163db73c3 +size 208731362 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..34bfe53d4b7413551b4ccd9e913727afa7c3eddb --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4d90010bac5153c4a023f1059a542a9f13f6a4e17db59917a467af31be2ef16 +size 208731362 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_75_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_75_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..479af8c3556eb9af81edc92f5458c5401db9dea9 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_75_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:89e59d757f6cdc7c8844426d9c616f88c02f9516b438bc8c16d3b8a97e35e72e +size 208732194 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_75_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_75_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b9102c88495a93799cd5d54b16d056595a81a3ac --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_75_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f070f5601b9a898c2defa4bc5a4e6ee3d07f963272dd3ee302172aa21408a643 +size 208732194 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5b27efa4fb5e0fd28559bee4ed7f96ae4c37c118 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8343d63da35864cf11f70b68bfde80f3bf1d87ef790d5612552a955046f3059c +size 208731490 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d393d5909e81441441ac8b9cf25438036fa6da49 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:614a6420b0084247854f8e2d2c70c81edd87cbeecaa1d91f396a9dfa30125c01 +size 208731490 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_76_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_76_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4bd49be08bb9ede64e4cfdb3c56d1bfe6b933c37 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_76_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d58ca59e6506b2390fb257e8609bd5799fbced1c6325b24b6d9eb8faf049756 +size 208732194 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_76_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_76_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c11c239b22da57e0d47bf96885837979e94c7250 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_76_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a52589a32584db7c154a795f2a7b4bc260a927f11c24a225d0cd9fd8030fe0f6 +size 208732194 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7d8f8571baa981e37066ef517198289391a4e1a0 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22e41221b69e7f420758aa29b293ac76769a7d95250985fef4d04e9d8760caa8 +size 208731362 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..83b6a8048009e5d75ff57b9dd108f29dbcd11637 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9cab53c01999fa8c42e30ca3ea25178d6823259bb49b734014de01851d324c3 +size 208731362 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_77_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_77_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..73c1d98edd7f411e8b1a8fb071dd4b7d79b88c5e --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_77_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c9385b9af54cee56f368605cd15692e9a34ee5d100210db4615d9a15eb2b918 +size 208732066 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_77_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_77_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..311e710300da4ab4583ed168d4bb66ef84589045 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_77_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f8a87c7ff159d4932435dc9b2c816c5ff429621c47c3f6a056d1e2f5dd9f6fe +size 208732066 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d71df769a6e515909e35ed35f7f4612576c78b18 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74fc80495c2dcdbec001358d3a102be94f0523aabbf290ec3700c6bc4d8d1832 +size 208731298 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..23abc07a3d4c979e4357f760564491ca528a9f27 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1627dee29568657797d02aea323984243c4e2898e7e5a80ba26506a5ec65bdfb +size 208731298 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_78_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_78_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f2bda8ebaa592a6000b608feab21135dc2f0909e --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_78_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e2e17faeb5af3d13ecf71fc6ca98084dbb643a254898543210308d293f63caf +size 208732066 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_78_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_78_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bf00c8a6f22a6b642932ad764f86689e6eb9e89a --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_78_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f4272897bcc3b39c37645583efcf732ec29c280f31255da6fa8bad4bf2d66056 +size 208732066 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..df32512e704208d2a8e506cde6f5120d21cf6aa2 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f5b6ad2d07cab5a12a47fca26d4a48564030e581344bf53bb29d574798d68825 +size 208731362 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..594e34a5df72e5a22c5f4d30646d2a52c008a602 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d6f1c88e99a11577a56855d705ea74f2c64d55f16eb8b3da47266263f9bf37da +size 208731362 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_79_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_79_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..54005868ea3ec189bedb45dd1afdbad07c641959 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_79_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d5b32eb5be8bfa99df95912d9e7e5951850be1cb162f9270ac58b398711a665 +size 208732130 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_79_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_79_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bdfa0e73a6e83c0f1658fe589fba387a2dc7572a --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_79_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae4ba46b283caea3bdfbfc79422895c82f75f426aac39d2945af8bf29803932c +size 208732130 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..758859eabca540cd2d60312c6326854c9d199f47 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d619a064b66794837e29e696af1997bcff0aa307c50a480a1ecb86d7ba66f7f6 +size 208731351 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..73802f4c65bc00e0e6e2ad78418836f60b7db939 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:186fff6d107c105d4b51c0ebc5b0884ac9d50ce7167705ceb6f6da0aad54d959 +size 208731351 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_7_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_7_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a1f3cc996f67a3f0de8c3ea3ae1aebe8065a8b01 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_7_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da906f815d19a6a44b1d266fafe8970c552e3e50893dfae845959693e01d00ad +size 208732119 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_7_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_7_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..53f2460f165a77585b44a85e8536efe96fe2e42b --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_7_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b0c63acad2509cbb508635693612f8f2e349063e4048605e2194406e2d503e8a +size 208732119 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fd532c42f945b535d2d55100a135ef13c04f546d --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eda8b7a5ff0b0e3035fbaffdbd2071b8b7f31b82ad7d2f721b62158c059211d9 +size 208731490 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1e6e8593b6118d196187d9ecf9e76054cc3939b7 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:42b93f4ac56138c3c8f089301c38b530f47018950b666a3b8a7309f6c5fa4c33 +size 208731490 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_80_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_80_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..49542b302524536e23cb5ac8dd13eea0c7e6b7ac --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_80_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb3f89c5907d4b00b1179a0d3d58880bd743ac4ea4696a05f0df3041d9de6d15 +size 208732258 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_80_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_80_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d7e394295b56268e4c8998cc51d176560c395eca --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_80_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8cb3e86e550471a293dd5e63249770271cee1893829163d17ee768b938fdd1e +size 208732258 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8cbac935e4b33ea101c1989bbde31de5299c9a79 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:26fa000545d7d926c121bafd7c93e35971411d25afa3f0d20009944a879fc472 +size 208731362 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..39c61effae0dd2232fe683d3cc5e90a6ac0ab869 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:588c86206f147085a45134dc467ba5116af2bbb1f65b6c4cdef5c3d60b9d82df +size 208731362 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_81_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_81_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d22ecbca06a18a6fe466b3804b22fcbc92f8d9e7 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_81_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84831f87b3356d4ff8d981eb6038af036da34655ec5998d9b71833b8a68ebb7a +size 208732194 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_81_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_81_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..81536deea4fa6955da4f19f655a1e9423d73df41 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_81_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:148d79dca2198b87ef326105246c8e2a618870c8fa2d25d1d5e80875c31418e1 +size 208732194 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..91c20ba38a2a2a41c84dde01f856bd96d61553f3 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c75faace9ecf35098401f4d802d175dc5d1273fb51fceea3a2ad991f74c07cff +size 208731490 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8cc0e47bf51d1e8de7a5cab3a42bd8777669fd51 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7ae763e92a412556e10dd6d14158287f4f429a45b630671011eb683c7fdd501 +size 208731490 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_82_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_82_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..58b7e1731c740e1e86ef3d52ffb4cacf2c87f08d --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_82_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d71da547c3be8689acffb10dece33f2de2ad67cb42e9c7d647c4178388a90017 +size 208732194 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_82_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_82_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fde968c32260fcd95394b6242fb9888286c79848 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_82_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e45ab87a13252dc8bd62455abc4ca42d1d6bb141433df2e2674bae92527b09a +size 208732194 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..47ebf1046c58f598c95992189f02081514cd8168 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f73029ef4f7382ac963a17f02f5a319b4e1e6f824773edc63cfcfaa3d7d03555 +size 208731490 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..06512e70727d554ade41ea6b4edabf3371ff12bb --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8641406f2b1275d31b764046bd482cf74bad70da5d1bdffaeaff60308f97d181 +size 208731490 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_83_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_83_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9698128e21c3b003107eab8f390c443474d7a38f --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_83_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:310b58bdbdf1a2f4e7206b75ad0f9e0b833888c13d36a686ecfa472df71e8f78 +size 208732258 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_83_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_83_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..254643c8e0c6b18392adb6df649efb1e3eca5ed6 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_83_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b5f680d1fb675a47d6c48ebb76f719abc7387e5f6caefe070dcf2483cae0cacc +size 208732258 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2f4446ef40a9b9633e21c045bb7bb31ca5d15482 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e174ae2487e83865f645b60470ec84fa34beac624add892c45fd86a5fe737568 +size 208731362 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dd61abe91f3b765882260d5753d10b24daa67970 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:18d1c064fbfbcb10bf8ed2afa7d5c01a10e6acdd892d1c5373ef7eda1f50468c +size 208731362 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_84_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_84_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a6fd56380f463ca371922a502f5d90b85668484c --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_84_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a3e999a0e7f15dad536e957f11c2d08df983d4487d4619cfcc9fbfacca86a7a +size 208732130 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_84_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_84_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..87de6d1f134bd8ba78ccd87fa5305a02a38e2ec1 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_84_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be6ed94f4472169ef1d3c2bae0eab48a15d390fceb87259e5ca9d5cd394ae6b4 +size 208732130 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..123015e975e5a3984470c522adb1645a775278e8 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6c150eb1f4c6d4fd794daffb1194a17c47050eee5f57d6c116e50fc122478c4 +size 208731362 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a440b370ca39ec0bbc384a1704438fd5791dd6e9 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:78ea340007b18cccbc318f9974b8248be0c58188d2b75b2b5bd208691b021d63 +size 208731362 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_85_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_85_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..098f5f2bce132fd3cbb3bcecb62a57107ee683f2 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_85_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f3fa10b822029773b80def29873236ffe941f140c75a82fef5d1b3c86a32a01 +size 208732130 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_85_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_85_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..041b14c167e6f56e9acc863d71d02d74e39b22b0 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_85_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c51e748dcc68ea1d97fa4800f7774f5738f5fdb8b206f3579dca54d8e4e1702 +size 208732130 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3eba9f3be6d22e78d2248c0c78cef20723918e9a --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb18e20a5c5c6a45ade7b32ae03b1e61c470cdc7c2a085971f835b2dec7361ca +size 208731362 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..eda006c987729c9ac9c9f2b3c556a1990e38bf04 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a3cb0066412c2f70e5c577b04ba17ce5b461e42771fb14b691f64e3fd762da32 +size 208731362 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_86_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_86_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bc4b76294bb3574bcf58fe7c804f78c7ad23262a --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_86_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a064c825878fd93139b8ea01da0355563334bb3bb7781d119aab38240c320beb +size 208732130 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_86_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_86_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6814618a8465d4bdfb663cdadf80c021f6b89363 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_86_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2fd013abf0083e11aab7848f0293228aba1485e47b85a5bc5854c2dc10cdd61f +size 208732130 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..05a0926c2b168d4515bc462b026afd40a52a0a15 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac154778a13cc6e0dd19d2f01479bbdcc4dde58051171d9e9c977b98ef8286af +size 208731426 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2e1ef46a7c4cd4aa50b4c1281fe4173f3cd542c3 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7546c7bc09e691cb09cccf513faad722de1bb5fb4bf5e94e24f89c0556ebc1c1 +size 208731426 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_87_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_87_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fbc0036a839b1cf3d67df4f1d68ae2c3b8ed3688 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_87_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa8ccecfa27f6b854272b7f1d734f7bb38dda152d4d542317e039c00e7827aa6 +size 208732258 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_87_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_87_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e4ccc1c83ddb33edd4abcb5b6503b7d4c25c74c4 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_87_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f0de7cd758ba9b6101e4a8d0649ae64d98c02d98eb062830bf7ade602dbb9bf +size 208732258 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..66e5848b6c6f5307c9ad617566d9b3faec60adc9 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9ec2faf8106f32d943181861d9d804321f59424ee5548fcc1df38d4dc5a7db9 +size 208731490 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3d8b85b60bb7c7cbe051fddd132ee04d1e34600b --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5bf2825c4da0c391a291ba0557024edcfdc496e3ff8e40012510d90426d2e1b9 +size 208731490 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_88_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_88_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4dc5cf8bac60344e8369d478da3823f9a46fd467 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_88_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:59c364c822349123c883c55b0b036e9a80a6ea16b81633f236e18e3ab35f2b23 +size 208732194 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_88_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_88_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1b31723cbffbb158a930f4f33820bc5449076516 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_88_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b4671ea2eba8c82f380338090f18be3a42fd28cee3c71f57e3b0c97312b9a8fd +size 208732194 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fe01a5216077dce71acdc442da9bd62e3fbfdc68 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2474ea07800f69c7d133a97738e4b22cb616992b6f0f816f0831c6636acb4088 +size 208731362 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..625fddb0c886c8c2686596eda058462b734a47ac --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be2cfc671210c017eb1057372f560a3ea3c76d7d3ea53799613ebd0e7b89e6aa +size 208731362 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_89_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_89_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..33ea621019c599b0d57979e5c0f04ac887ad7039 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_89_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:319b40f2273c1ee208e6e79fedc1c79a363f1ccb34e4727f27ec4024d8f07b9e +size 208732066 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_89_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_89_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..33c02ddca21e0911e9dcb4935e9fe55389d2a4a9 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_89_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f09308e98550b4a8318763bdbff91d7c38e1c5de65e4354e5f8e474edc214fb9 +size 208732066 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a53f58d1334c6761e6f89e71e5bbedb5c4e3299d --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:578f30c6a85f878128964e4b25c1af2b2966b27556afc32f9f6011512bb01101 +size 208731479 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..94267675295bbce3c47be0dd633c8954c9f42609 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d131ac12e1fa431706184f0a39d098fa60007d62347c66bf37e365f8f591264 +size 208731479 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_8_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_8_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f07cb1bf7841dd3cf4332cfad386e8eebc364121 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_8_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f5776f214812cbe968709c955063248dfb537c1a370ff7494581f3b2eaf4123a +size 208732247 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_8_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_8_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..99c44128e4eee6b408ebee1b65e8cbe6d807381f --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_8_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c17cbe4bb7c33420efbba1a4c674957b807e1fba9592f17d088209793acb0ae +size 208732247 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..48137ece443fcfb9e28b2cf869fc02b88fa6c9dc --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90a8f502992966c0b9b303c2735d0b91784f48059fa94922e62bae5af55ab74f +size 208731298 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..182b1ef62a91d3935c681ba9bf59b73c1a29b541 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:82c0b3b3e4be8c42c27dd3af7ae63f544e31c8feaad09f0412c9f6e29ae4d1da +size 208731298 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_90_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_90_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bbf90a14222834dee67cd3e9f78a88e0eee9f482 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_90_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db5e8a7d3fa5b324fac27595ccd301e6837a486181af95701419025a3a430001 +size 208732066 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_90_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_90_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a840905ac26ce46b010d6fd7b0a4b178abd01256 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_90_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:41fe3ffaa352aa59d244f1c1664bf696abb3fc84ecdf3c1d941c3750ec24069e +size 208732066 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2f9797ca9641f044403a5fbce26847ffaa95e552 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa5451ff95dddecf28dc94af5d1efdf923d12a0694d17eefb608dedb8eb6fa15 +size 208731426 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..62ce3ab5e3af7745eb2d88af7bd8b94139e41d9e --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:abe929a520860c549ac2e51e357560dbc7cbb30b4be13847ba3fd13202187ed2 +size 208731426 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_91_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_91_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..15227ea850146da902dfb7844594f0ec9833479a --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_91_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:12d875c473f70472de632a5253822254608279aca8028ef2e9f1201647288246 +size 208732258 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_91_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_91_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b04e8a2440673f8580286e0baeb2eaf42f13ab6a --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_91_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c050ab9c758737fdf9da2531825c8f333578e1c89730c3ab4a0b9dfec134a03c +size 208732258 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9d6e010a6339e81ab69b21a01b938662da13cd09 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:99105b0a5697308f9be124729039bf6836084e47e59afe7f82836a468ca13b14 +size 208731490 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b4953652958505f3b6c57d78e5b35d46e46af7c8 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6549b6aa9c66240c25269bd346d082e39b6fd681de1d85f53bc9c2f5451faba +size 208731490 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_92_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_92_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bb49d760a9c58fae849c0a0e95a161b23f3f3b84 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_92_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd5c215c5dc1b7f41e006f5d6dbce7f9523250b4e6616d26bdd0617529f35088 +size 208732194 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_92_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_92_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..eff73518e4c03589b42181d06322819bc174127c --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_92_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b4816d441d90da3460138f72726c397c06a728a4769a9824d679d7bc764bc52 +size 208732194 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ffb8b67b0a648e4c53cce8b652e87c73d20eeb70 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3fa73f22f2597e0f735772d9dae4ba84560d150cda335d4f8061a3787ecfa690 +size 208731362 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ab6d242aa781556cd6cde7ce63f183e7904c3d56 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e719d21e8dc05a96a2fbab32b033a5010b8b7bc1494bafd2c014648079f218a8 +size 208731362 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_93_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_93_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..51d83dc9ab2dec612fd5073b973ea0cc74c52db8 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_93_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dda29e612900c9b6102343dcc3e355287f65a2e2fabef1dc9422ebf6caea2899 +size 208732130 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_93_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_93_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..06135762f683dcad676dd8f95e8fd1bed8d57995 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_93_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b53caab058b7fc0b13665fbabe80b67163d8d6637fc77b341c8fb74a9ecd7a4 +size 208732130 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3cd225dd7bb7b40dfb0b3b83a67ca5596fbe5d9f --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a2c3ca7346a2adf17a31ae8a6b4a8a1de1414a9f0237c393b14884ea8cee5f5d +size 208731490 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bd7f793b0cd9d8309892b941b0015095abdebab7 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c028b9ae4331cd8e99b0e93db1a0febcb204fb35d2d42c87938d37e4b7c21cb8 +size 208731490 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_94_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_94_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1f16ff50e12dafe4e6461662860d4733ee15473e --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_94_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:26f4d4da049ffc672d43135b8bf63998043a77fd52ffad166e2aa8ec7fec6ae0 +size 208732258 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_94_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_94_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d0ecf793e3bccaf2a7f886f3b301414030efa3c6 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_94_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a0639cb0a7e124f3108a60a16b3bd2f11bbd7682eefe88ff521c7d7cb2450ab +size 208732258 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cde1f7811105c2853cbb89510a6efd4aaabcfe34 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f54dd433dc94db808312a3c7b1b9160b9d1702d6a43ba9d734218bfcdc27df8 +size 208731490 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..df401795d62f79fe0596633ac80a97b8249f3e40 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:391d56b9911568270045ae85f3b68ab6a665b0cc8aa4403a056124d93c409980 +size 208731490 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_95_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_95_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ffd5e8d871068b0e78a256f1a295b46a18ca688b --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_95_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:faf44cfdf2edd94bce2dc4c212f62884bc36834062921ae0c8b5bcb41c87ad8f +size 208732258 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_95_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_95_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..05a38543a24309fdd37389a820a8cbd2b799a467 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_95_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d8d18367687a63fe3b18506a118de69c27e55bab6290bf27b8c8a59a5d87a21 +size 208732258 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bb188c5442c85ea9e78b1cface015a638b9d1e48 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb875ad8e2f4254a41ce1d7ba8d14b71e4d799e63953cb0417edf660182088e3 +size 208731362 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..834d93b934fbec3102901ca9aecf40611c79d16d --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:80c03db342ca9e680f2c7d1f882b6611c691baac4e3eab4a244507a4766557d7 +size 208731362 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_96_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_96_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d3ec7471cd45876d4fec8acfbc2afe37e9f43c02 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_96_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:94ca6b012b035cd3f0aae186aba424be7f90b27ddb17763b14fdf1afe654dd1d +size 208732130 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_96_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_96_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..03b870ac99022f32a4ee8cc990abab4455c0af3c --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_96_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4466830be79c425a3268afb258cab8508bc5b376a86fc4ac0d68243720b4b861 +size 208732130 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..22432828a5407d8fd704cf3097c1e794270093ea --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7ddb579cf35cbd96c5cb49a843efec526fd27a1a33c8b6f0d9b9aed4707ae9b +size 208731298 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cac510dc45e959bf0d4c1eca2f04be130f5afcd3 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4128d5ff77d2bb79d523dcc8ecd943d8c2b313a515298748602c9580d87e9f66 +size 208731298 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_97_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_97_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..59e7c9f417e12e8afb8ee2c13e9e467baff70eb1 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_97_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e478f5b859601132edab952f1f78f768fc693cc8304500e905db81ad7ae6fa7 +size 208732130 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_97_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_97_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8904e48b9681b7282fa641cab8f39636f1e636d6 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_97_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c6e0d465d71480cd25fcffed797c5aad7cd5efc99123da624290280857de889 +size 208732130 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0a6a52529abf6908d12c79db267a00b7d1e411d4 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5461530ec0262d44064f603e56802d369cd14fad9cb98e8ff1d278a889586c0a +size 208731426 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..eaf58dfa78b52f4c5daa6eaa5e5e0e1a25de91b3 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c4a9568405c3660d2c9c6db3d9e902e48447c22d64db35270800eb945b718d6 +size 208731426 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_98_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_98_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3ffd00282f1bf90bb66a0ff5b4bd21df8027c7d3 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_98_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:71c5448e03dd857fc9e9ea2847484d1145b92db3779f6d8b5f2855dc1d310dfa +size 208732194 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_98_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_98_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9c1023a7b1da261dbf5d1651a5cc2cae4012aaca --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_98_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:272bd1010c9ee4646110e2d2403161f8b25136b15c055520b00b0b8d2b7d71ab +size 208732194 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..29b12ff43339392f3a068284d16d8512fc18b722 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76e6ed38e0bcfea609adcd24d14fd61a269b48726a487c9a5cd40c473671785c +size 208731362 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f8e562bf61370d8e08c7437d40b4b172a72bae61 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:207dbb418196edaae344e580314a5a5c9c2ffa6848f0ec949bb234f8a5a744bb +size 208731362 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_99_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_99_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..35dc9c72f7680a1adfeda811cd3fa2a90df2a3b4 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_99_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:700c5fe419dd4ee8161c24cdfa0ffcd411eb8aebc9cc5ce41643fff2f1c062be +size 208732130 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_99_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_99_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1df3dd8ffcca19526c66d73dcd0e3cc138bc8b99 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_99_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0df0c357b1c7b22d06381d3ef9641864a52776521c583394da06fdf23e5c8400 +size 208732130 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b93b72898e0a7451ddaf79c294d635aa896d8fde --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:090c925e85c2216fdfdaba59748ba0365e7bf9ba92a250f7c1717466606881d1 +size 208731351 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..71f6877c35f0e9d88aa9a6829f9e37b1b047c431 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a2d8f9a8de0695e7dda097873afa1cf6262aec561dac87fb2fae8af4d0fdbd43 +size 208731351 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_9_mp_rank_02_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_9_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..475d334134267a5ff69392c873d4e65ee91cb282 --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_9_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2cf0f471b3ac90be77e9f8b05eb1b202ab4ea481903294435f06eacc34a84d6d +size 208732119 diff --git a/8b7178b58b/global_step84877/bf16_zero_pp_rank_9_mp_rank_03_optim_states.pt b/8b7178b58b/global_step84877/bf16_zero_pp_rank_9_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e6c1deccb31f0210e38e0afb85d48c41f3aa1c3e --- /dev/null +++ b/8b7178b58b/global_step84877/bf16_zero_pp_rank_9_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a1e7447e5def7ad624fbacb3a38f36b9a140c4140bdf2e5b23362dee4c23b857 +size 208732119 diff --git a/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt b/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c500f1d59aedd0ba1dc5efa0239812e8450e48ab --- /dev/null +++ b/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3a2035dbea144f6d6f2197fe8151c0533e13b0fa8705558fc7911f0227ad5c1 +size 223347971 diff --git a/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt b/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..03751f59a3f268ccd98ab7dd8ee69da20790660a --- /dev/null +++ b/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ede2c88c6b8dbc295b1fdf41cbfd77e2eaea315ca3040fcdf74694736d2dab9c +size 223347971 diff --git a/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt b/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b60d09b7252483e6b8b9ab706d27ac825e96b776 --- /dev/null +++ b/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:608f2f9b0129112c5d74156ba1cb1b269a99f2209c29392e4f4609ce44ca50b5 +size 201408771 diff --git a/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt b/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..311027e15c95548ed8b3e6f9659a671b0f69e89c --- /dev/null +++ b/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f8e34dd8683f20dda66ffbc02e0d7040e966fb94a15eb572129bb822ea1752d +size 201408771 diff --git a/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt b/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ebd99afc1625246d86452852d7e9769275768fd6 --- /dev/null +++ b/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bff834b3f67c05a884a117f7aaf4e2dd9ae56365a267a415c8200d371dd16f75 +size 201408771 diff --git a/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt b/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..27a5f79277d52078fef2bae4b86b0c8123253f23 --- /dev/null +++ b/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da18ec7a987d7476141d507bd9c70b38fd8d2c0e5fa2eb01b65401c52da93451 +size 201408771 diff --git a/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt b/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..03b936336d229c82d03627a3c6e5ccfa7b9d3277 --- /dev/null +++ b/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:212c46ea354be613227999a8774f03aff9fafdbdf926b33156c81b73a69fbfa6 +size 201408771 diff --git a/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt b/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9a57260290ea5a38b197b039d7b67906cbc3da0c --- /dev/null +++ b/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a29e6c81368d4ddfb0c7acb3b9a1c6c7070182a96d9df42c2edf3dcb0e570ddf +size 201408771 diff --git a/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt b/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..02de18f9681f9fe8fbf4548c39a61c7d7c752b74 --- /dev/null +++ b/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:41702e038a5e4f0df43e4f8539610cffbc294a29420124dfbba765649a052dd6 +size 201408771 diff --git a/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt b/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..035328c9829e5302755f3db3b299fdf0e9636065 --- /dev/null +++ b/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8525602476bc964ea177ef362368e09d2cdfe182dcd464ccf4b70eaf43cdd9f3 +size 201408771 diff --git a/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt b/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..91d1f2788e8064e52a3b288714e2ca2eb44fe3e7 --- /dev/null +++ b/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08ba17136f4aca6edd4ec9cac34a30a2b7160bd9746d7d56222cdca5e1a5f35a +size 201408771 diff --git a/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt b/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f390a2097babe98613bc714baa413e0a5d258da6 --- /dev/null +++ b/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:83be3a9d1a238d69e3118008e9c5f528b0d9ca98d2cb423f7239f1b9d8853f63 +size 201408771 diff --git a/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt b/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8f0f64251a15eb96d39b1cbe3e6ccd24ca290a14 --- /dev/null +++ b/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fba804f81a57af4ceadab5e4f26a5dc3e8f13891abed0131e349483ab01d0f89 +size 201408771 diff --git a/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt b/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2e87b5e6a895fd754814b2be6d211509dc9b0f07 --- /dev/null +++ b/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d7c2be5b020972a56f248c8b491a8f0b880323a00886de3ad95c04822510b44 +size 201408771 diff --git a/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt b/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..858f133152203df1bc9f1285ba92c5e64e0d9ffc --- /dev/null +++ b/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2abefc8a90cce24a9b8bcc2d7b58b964c9264e874e8f6ac8d4cc3354b297beb +size 201408771 diff --git a/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt b/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..40a1ffdc5f22b255e263ccd763288536948d5c9a --- /dev/null +++ b/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e5fdfc0e2a4f54aced1c3cce3ea19768811049d01a4549816ad5cfec92ea7969 +size 201408771 diff --git a/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt b/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..940afbd9627f7a0d4501110345429028f960413f --- /dev/null +++ b/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d56dc4fa64ad6467228b44d7e9b6093668cebb7d54cb6591b76711139f34dcb +size 201408771 diff --git a/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt b/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2bed40f21adb3243539c76dd6fe98f425c5ff3c8 --- /dev/null +++ b/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c21052eea6749f711391173679b76c35e551724b83e05a3c7900e26817e26c51 +size 201408771 diff --git a/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt b/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..958a42aff7b90202b03b1501e96aad45dfec5e95 --- /dev/null +++ b/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d1dff1e16118a242e4067ee38a1dfe549a3b18e099e52fef951fa6dd9e4e74a0 +size 201408771 diff --git a/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt b/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d7c7634f803aa84a587d5c86e0f787b4c174dd1a --- /dev/null +++ b/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c42a532a9f44a4a786f9c37b5770893b59186210d5d2d7cd5a80f8a97008b7c +size 201408771 diff --git a/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt b/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..872207b501155ce7787b106e4a8b7e92e217bc2a --- /dev/null +++ b/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c41bc3f45750b51e5f76feff6ad74844ebddefeb3258064330cce59d05b0cab9 +size 201408771 diff --git a/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt b/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..18eaf6543556a7bda655237690ef6579efcc3ab6 --- /dev/null +++ b/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d362a4dd28e7cdb760223310a9df4fdd82ac34b0272e0daa8e66567cb40d5ba +size 201408771 diff --git a/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt b/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e416f583b20e7bee637a2e2043358c0b7477b6c2 --- /dev/null +++ b/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8eb48867d018430d7296085b84fbd4fd3ff881eaef42a31443d8206c1313f5b5 +size 201408771 diff --git a/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt b/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..312f3c93947f4f459dfb560dbc58a0f4543d352b --- /dev/null +++ b/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8dd1b25714e8a67bc2af293f90d21d2be72e275ceb0918243b50401e0d47a017 +size 201408771 diff --git a/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt b/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5d3748fa8a7be77de0c8568a0000002822e63c32 --- /dev/null +++ b/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc88edde137b0d0296ef494937973d43611aa9680c5643f15d92f6885786a67b +size 201408771 diff --git a/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt b/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..154dd61e0c45b09be482342cf4fda232baf14392 --- /dev/null +++ b/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:452871462e9fd614b5d8b60d2d0b9ed6aed7b447278f8446a870124873c504e5 +size 201408771 diff --git a/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt b/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d812455090afae3e7bd1981bd8623f1ffb534ad5 --- /dev/null +++ b/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a41296c808294e98c5215ce1575973e78c4eb4b5a9d702aa367092ee189d766 +size 201408771 diff --git a/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt b/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e745390ff20aa05696066626145305002ece828a --- /dev/null +++ b/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc8c024cad87b39962d0d477ac5af999f09447b818aedd4da6c91ee1cc2986f7 +size 201408771 diff --git a/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt b/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..89639c97c3fa44bf89c3a02a25b8df0d835149a9 --- /dev/null +++ b/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8144ae182e6f72b5e0e28f115092b014117d9f985c567716747d2e5491f63225 +size 201408771 diff --git a/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt b/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d8f78dbb68a617a1492ec62e913aef5aff7e60ea --- /dev/null +++ b/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5327755ec932f5655ddcc961883c29e334b27702273df4371541c27a3add67c8 +size 201408771 diff --git a/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt b/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..37deecdb11a8fb61cc9bc3135ef048625df3027c --- /dev/null +++ b/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0223e0433320262da2d5f82ea0297ad7b6ce7b67ad39dbde904bc1e5624335e6 +size 201408771 diff --git a/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt b/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1ac6e5220a175541668848d0035e4808111a31ac --- /dev/null +++ b/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:60df0661348534976bcd6c5416085ed611b3c6c792a46bec798d2e6ce92bbb11 +size 201408771 diff --git a/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt b/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f0b49536b831812c134f8731bbaa5f1116692857 --- /dev/null +++ b/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:819e99e97c83afa37e79f387349202cb49329081f6470fd4841f3713280d9757 +size 201408771 diff --git a/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt b/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..81f58d21191dc60ec11eae19ae6844f4c45ab76d --- /dev/null +++ b/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:269c85edc49596ef1b0c582299ca11dbebc6d198cd1a5ccb0c12f5c553e989aa +size 201408771 diff --git a/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt b/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..90b2e3588c1817540186c98a3098693e1201ce76 --- /dev/null +++ b/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f55319300be159a4f7c120345420b9dc05b858564914b6835712878578dd4d9d +size 201408771 diff --git a/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt b/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4dfe929329ba8f7ce7408d83b130b2f83689145d --- /dev/null +++ b/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a0d24e20f30f355886e03725bcd93b47a8a0cc14a2d1d07dd599678d4aaa8ef +size 201408771 diff --git a/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt b/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..91217ccc333ea478aac1f37dc9e34cb3392dfb1a --- /dev/null +++ b/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5048b98ad823da9d9371aaad2ce612cbe704c36363d7b0c708d60e1ee5c04d27 +size 201408771 diff --git a/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt b/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ef9ac8db88155b7878b943759e409617832ce7b2 --- /dev/null +++ b/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:250b69eb5fa6687655a0cd0333f7d569c58ef47844d8786a6d009cabd074712b +size 201408771 diff --git a/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt b/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fdb228e497a4aec9c546c75ca6a8cb0fe7703d2c --- /dev/null +++ b/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0615f9676fe8b4fc246ea7bc6013bf2415ace9f15ffcaf0d6a6c0e6921dc39e7 +size 201408771 diff --git a/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt b/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0b72998c6b1d90497dc9e637b3d5f88fc8997dc8 --- /dev/null +++ b/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d527f2228e4a8ff814e35dbce7dd72db105e53f04a82ef6f37858f21bf17f6bf +size 201408771 diff --git a/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt b/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d64a2f3481536d171b3e6fc091dbee969a2aeefb --- /dev/null +++ b/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0042a0bee9dd759644423045c409d5aa8d218bc9909af4a2bc443be6b04ce504 +size 201408771 diff --git a/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt b/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7a94ed8e53f2fecdc98c87eb034cafa4adc28f4d --- /dev/null +++ b/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:65e898c99a0eaf2ad8930a9b35aa184693cadea376dfccea79f4b21f9772addd +size 201408771 diff --git a/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt b/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5a756897fae4151b0f6f57ea58168b62063a118c --- /dev/null +++ b/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d0be2f40226adebed77e3a903c758b8b5e5489048c35999bea17b2eb8a817940 +size 201408771 diff --git a/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt b/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5ac20850f2bd0b69a6d1befdc9e13edbf4775c60 --- /dev/null +++ b/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d0c50f9fce1422ba54a677fa2df54049b6eecca133c9751914961d39c47e884 +size 201408771 diff --git a/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt b/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8b1d150edba571c4bd92b14820396a404e81a54a --- /dev/null +++ b/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f600739e5ffd70b9b52008aa8319f10738c0b5ebf6618423613962481929381 +size 201408771 diff --git a/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt b/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dc7c30cd8ba75832c799c55ab81fd99877ee677a --- /dev/null +++ b/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8e3f2c83f1a484bd0a96ac74a482fa577dc5d6628b7e74e9e750951e69116ab +size 201408771 diff --git a/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt b/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..035af657ac7d77b65fe3648fa7213a9df82b317d --- /dev/null +++ b/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb79eec98bb8ace5a393d5d1a31b423003b94ce9f29e0b083752d8ea53f3f7f1 +size 201408771 diff --git a/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt b/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0894e7f5bb06b162292baf6bba6e722cf6e8d9b3 --- /dev/null +++ b/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:82096215fd04d7391e7a985e95765a8ad3cd1baf67173e2c71d5f5a98c377d56 +size 201408771 diff --git a/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt b/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1252c68ba810c90112ea2db67b2a6a42b05d8004 --- /dev/null +++ b/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a33bccc629bfb1069545c25fc1b2774af178f0d0af922c9c5b7389fdf525f8d6 +size 201408771 diff --git a/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt b/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1bed9487c8908af0cff57b46bee5a0e641bdcd77 --- /dev/null +++ b/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f1ebc65f314749831512726bbf605ce6dd505cd348b9231e82fc94d739521d9 +size 201408771 diff --git a/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt b/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..137230faef423f58d87f3a7b19a8e09a9d943972 --- /dev/null +++ b/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:70af72960d8f6c422a59513616f1725831ec932dd6d66ca5ce18f809d84dff55 +size 201408771 diff --git a/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt b/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b9c27f1a8bd97ca7d660380b8342a45f769752b6 --- /dev/null +++ b/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:100347a837d37f6527717421334e62e05b8811aaa90a4dcb224c46b27865c17d +size 201408771 diff --git a/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt b/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f502e840aaf9cc2bca76027db7defd17a8d064ee --- /dev/null +++ b/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:386d48b0d237a645b003134af96f721c25893032b109bf62a6582a96e4303bdd +size 201408771 diff --git a/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt b/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..57a59c32708fd961f72a99f3fb2638748f700aeb --- /dev/null +++ b/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa8a64e2d22254eeae19555c5a9b5b9c731a707dd4aded83dca6e8a4409de4e7 +size 201408771 diff --git a/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt b/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..64fe74dcf451d03595fdc7f68b5f812debff8c37 --- /dev/null +++ b/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6a7eb8507b5af28d88821b384ef92d9a6391cedadc91f0d76717445f5d3e566d +size 201408771 diff --git a/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt b/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4be269bc3c718383f76ad946bc4797e580dcd13a --- /dev/null +++ b/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7f21a06c49c5c533fb36b092c593f63da7c8612443861457ea5e57148851222 +size 201408771 diff --git a/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt b/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f5860c48b359ae7aea8c63568970a89075c92c32 --- /dev/null +++ b/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ddc0a71081a461704564626bc7e27a362df6f62493105a89c5c0e30e2f8aa030 +size 201408771 diff --git a/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt b/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ab4eee718df8b2f0081a249381d5bd26f6b3cd1f --- /dev/null +++ b/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f6a05a2dbece574c65a4a544669e5f53a182e6ac840bfdb25da80321638f7bf5 +size 201408771 diff --git a/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt b/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0563cc939626f221d592c4ee4837d71ee880c3ff --- /dev/null +++ b/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d98f1b432e72d210759745b1e2797f0ac4a875c917608d04dd6db8c7fa0e879 +size 201408771 diff --git a/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt b/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5253313fe9cfaa3e7876c66f3cc39f4ff53ba6b6 --- /dev/null +++ b/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:754550ad845f856ae535809f7876fa69727f888282a4c987082e75e1804cf2c6 +size 201408771 diff --git a/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt b/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7ad068a944fd21f587655f93f2bc6c41048d1541 --- /dev/null +++ b/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ac73982353abf4bda88444d4459393df0c9fe1c749f1fb039208e0785a47e08 +size 201408771 diff --git a/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt b/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..87ba1c7dc293982a4e8f0790f36714b4fe4e3807 --- /dev/null +++ b/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:818fe67472af00c61306863d0a49a9db3f5f90358b2aeb62e0a96b37b7fb4828 +size 201408771 diff --git a/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt b/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3042bcdcb4d31c3b4fcb31a689017af39f7636b5 --- /dev/null +++ b/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f755104f11ca5db0e49f0622084762e53b704d257991cf4c37169dd2d32d1e9a +size 201408771 diff --git a/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt b/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..330b1747049420039810f05a9c790ee0e45788a1 --- /dev/null +++ b/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:11b91af9ef3ce09ef7b0768d51776327afb3fffb1e35c7e6fbb5942981d7121b +size 201408771 diff --git a/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt b/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..88c639f802968f166e81e855d6c7f56c4163271b --- /dev/null +++ b/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d25f38977e30f2c6d4c64bb6b776893bf6aacf911a54c76d7237266da00203d +size 201408771 diff --git a/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt b/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..247e9ecfd1f3da6ed8519177616bf685bb7153f1 --- /dev/null +++ b/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b189086dd3acc9ec14816b02f3492ddea149e5476eb15502e4ff526d9c6a54d +size 201408771 diff --git a/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt b/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a1f996d0fe6f4b7f5728438347613ede8c176234 --- /dev/null +++ b/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a821cd4a0c5a0af28e6c0804871e7940791e96f4c088f1e3fc768da599a3a51c +size 201408771 diff --git a/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt b/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..257c78c39cc34accf90ab8e0ebd9525754e403eb --- /dev/null +++ b/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cbf4f8d95c6064cdfc74e00a18e590f1e050b151ce9131765690a918ee422f87 +size 201408771 diff --git a/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt b/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8b17807c35211fae58b31ef7cc4082832200a701 --- /dev/null +++ b/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f979c85a3cba29f4452a163b9876bfe0ba58dd636969d4332270b586d647de4f +size 201408771 diff --git a/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt b/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..abc93055d4be2502659c62d72f1523a0bba9495c --- /dev/null +++ b/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d15f702507d8655b7b057a8ccbaada3868dcaebf669a83517f71cecbb07f665f +size 201408771 diff --git a/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt b/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..64611cb0b4ec127b320ad628c042f94c9c228a70 --- /dev/null +++ b/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:494da5b4a497ff593be1fba8a68321f2ec53df6f970acf8d010459e642487005 +size 201408771 diff --git a/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt b/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d10d5c55eded011e8aa9fc1098b4bcc211bf05af --- /dev/null +++ b/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0009960f31835e333ddc836ab01a8a3bb8214c77ec12b96316c91c66664e7e31 +size 201408771 diff --git a/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt b/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d0de4f8f1b5f7462f042cc63f8ad364df8061cd1 --- /dev/null +++ b/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4296299f8507e84870ecc96a0835ad4c3294a0aab983791f244c8e9b79f51bbe +size 201408771 diff --git a/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt b/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fb8795fe4b4f25ed2a97426e8be689015cae6f53 --- /dev/null +++ b/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f8eb3ba40037272ac983ec40fb3cd52d706055fcdd7c5f78503b47f926af9ad3 +size 201408771 diff --git a/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt b/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b6c334ef5456431ef8bb52cb96b8e2189895cead --- /dev/null +++ b/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:37dd180b4359f310d97d5c281059b26ecba9b7ed6ce6d4a2923174d7d2fc78dd +size 201408771 diff --git a/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt b/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6572fb244e71efe1e145a4865167fcc50e8cc414 --- /dev/null +++ b/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ceb448027af93bd9501d7f64377627461c3237e53f5b9466b22e20360fd5f27 +size 201408771 diff --git a/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt b/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d2c73a0817ee7d98c6dacba0a2f1128f988f51b3 --- /dev/null +++ b/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad0a78a04b5bb0e70d8255d98fa8e9593d02b3f0b8b785fd47268cc71b8ae4f0 +size 201408771 diff --git a/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt b/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d70ececf3744cdb7d1774d0b005dbf287559e853 --- /dev/null +++ b/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:270e352791b974adb74d74fd03d03c9282277c1001608680569d2dc2d42736f1 +size 201408771 diff --git a/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt b/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e6546e94974339b0ce6daab38984197b6d077db0 --- /dev/null +++ b/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a11a4827c29bead5c63565fe75e8424ed343332138457f2970bf618419d9cfb +size 201408771 diff --git a/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt b/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3878bf008c13801e514502b55fa2fdfc657f6462 --- /dev/null +++ b/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5bf78e8d08f87b852425af5bf75ff91e552f65da8d5769e8eaf109cffa375245 +size 201408771 diff --git a/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt b/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..91eb00051981b70435680647f8c2421b62aee654 --- /dev/null +++ b/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6dc2fc4e622a345724fa8f92fde4ee0d50e450c8656e7086e62682c1ac10f3de +size 201408771 diff --git a/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt b/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c52d2cf5fd6442ad256b3c6bf85641f1a70023df --- /dev/null +++ b/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b2839f93a6813dc9c8e1fe7b6f8dfae697a23ded2849fc9465b388e470a391f +size 201408771 diff --git a/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt b/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ce2e2919926d417cee73933a6f617d06b4a9164f --- /dev/null +++ b/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:17eb65cf9bdfe76634f1e0e7dcd672c8467844a897b9d69db5b410e8b95dff6a +size 201408771 diff --git a/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt b/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..283b617ce69eb0060a65f9a26558c2e7be7f0985 --- /dev/null +++ b/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df2e668e28eae5229c3c7a23da03492e8a37584116cfff514e45db9b24b99625 +size 201408771 diff --git a/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt b/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1de33eb37eca7a0180c76dc9ee8df1747adb4839 --- /dev/null +++ b/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:94d82bed25e21ea95ebd417c2ffe743830211678356a2f9910b0c094b559d77e +size 201408771 diff --git a/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt b/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9f3745b271142e9144624be90ef4bdfc9e71a237 --- /dev/null +++ b/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7499508fe11f1b1e03080cee7ccc19d42f486a39763f349fa1fb184dd80cc12d +size 201408771 diff --git a/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt b/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..50daee852927d3231099db58aea6e861fd14c6a5 --- /dev/null +++ b/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce48e83ff39fe066d0f00ac2347b5829f0c8d7a39960bb1a99b4c0d94b0a2530 +size 17603 diff --git a/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt b/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ff6905de33df9fc3392cdacad2d44339db1b1d20 --- /dev/null +++ b/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d2cc13425a7b3d07b4cb35d01f2c654d17a6eed16d8a7c234c08a547fe8ff89c +size 17603 diff --git a/8b7178b58b/global_step84877/mp_rank_00_model_states.pt b/8b7178b58b/global_step84877/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a2049f304f1fec1d4f50072dafc751e47affbe73 --- /dev/null +++ b/8b7178b58b/global_step84877/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8051eaecc967caa98c39c05006cdd257ca4a672986a5926ba5726399be6efef +size 40115 diff --git a/8b7178b58b/global_step84877/mp_rank_01_model_states.pt b/8b7178b58b/global_step84877/mp_rank_01_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a86400c78ae7fa97d8b51bd580157e36c0b77f16 --- /dev/null +++ b/8b7178b58b/global_step84877/mp_rank_01_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6526553dd2ea9fe6a49b87211e38911ceec00b8587926affc1849f45b96a5ba5 +size 40115 diff --git a/8b7178b58b/global_step84877/mp_rank_02_model_states.pt b/8b7178b58b/global_step84877/mp_rank_02_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..33a311e0827db747bd0534a63541ca158811c4fa --- /dev/null +++ b/8b7178b58b/global_step84877/mp_rank_02_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c5ba01be35cefcbf34fbaa3694f781c3bafe1be62b7aec7540b3a748ad77e5fe +size 40243 diff --git a/8b7178b58b/global_step84877/mp_rank_03_model_states.pt b/8b7178b58b/global_step84877/mp_rank_03_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5d4a56481861ee47525b38e79b121b16d237bc75 --- /dev/null +++ b/8b7178b58b/global_step84877/mp_rank_03_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c81d502c6d7464bf878bdb7b84322f35d2bf8190c782fe72339d33d550cf030 +size 40243 diff --git a/8b7178b58b/transformers/config.json b/8b7178b58b/transformers/config.json new file mode 100644 index 0000000000000000000000000000000000000000..eadf3eb13cecae9db1c34cde4f4d373a9d0fe00f --- /dev/null +++ b/8b7178b58b/transformers/config.json @@ -0,0 +1 @@ +{"vocab_size": 50432, "n_positions": 2048, "n_embd": 4096, "n_layer": 42, "n_head": 32, "n_inner": 16384, "activation_function": "gelu", "resid_pdrop": 0.1, "embd_pdrop": 0.1, "attn_pdrop": 0.1, "layer_norm_epsilon": 1e-05, "initializer_range": 0.02, "summary_type": "cls_index", "summary_use_proj": true, "summary_activation": null, "summary_first_dropout": 0.1, "summary_proj_to_labels": true, "scale_attn_weights": true, "use_cache": true, "scale_attn_by_inverse_layer_idx": false, "reorder_and_upcast_attn": false, "bos_token_id": 50256, "eos_token_id": 50256, "return_dict": true, "output_hidden_states": false, "output_attentions": false, "torchscript": false, "torch_dtype": null, "use_bfloat16": false, "tf_legacy_loss": false, "pruned_heads": {}, "tie_word_embeddings": true, "is_encoder_decoder": false, "is_decoder": false, "cross_attention_hidden_size": null, "add_cross_attention": false, "tie_encoder_decoder": false, "max_length": 20, "min_length": 0, "do_sample": false, "early_stopping": false, "num_beams": 1, "num_beam_groups": 1, "diversity_penalty": 0.0, "temperature": 1.0, "top_k": 50, "top_p": 1.0, "typical_p": 1.0, "repetition_penalty": 1.0, "length_penalty": 1.0, "no_repeat_ngram_size": 0, "encoder_no_repeat_ngram_size": 0, "bad_words_ids": null, "num_return_sequences": 1, "chunk_size_feed_forward": 0, "output_scores": false, "return_dict_in_generate": false, "forced_bos_token_id": null, "forced_eos_token_id": null, "remove_invalid_values": false, "exponential_decay_length_penalty": null, "suppress_tokens": null, "begin_suppress_tokens": null, "architectures": ["GPT2LMHeadModel"], "finetuning_task": null, "id2label": {"0": "LABEL_0", "1": "LABEL_1"}, "label2id": {"LABEL_0": 0, "LABEL_1": 1}, "tokenizer_class": null, "prefix": null, "pad_token_id": null, "sep_token_id": null, "decoder_start_token_id": null, "task_specific_params": null, "problem_type": null, "_name_or_path": "", "transformers_version": "4.25.0.dev0", "n_ctx": 1024, "gradient_checkpointing": false, "model_type": "gpt2"} \ No newline at end of file diff --git a/8b7178b58b/transformers/pytorch_model.bin b/8b7178b58b/transformers/pytorch_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..0def92182624d8ba836623155249c56832777ee0 --- /dev/null +++ b/8b7178b58b/transformers/pytorch_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf69e2f3ab8ce45fe8027c1223eabefad3da62d3de64a2ad3e657454f5127f5e +size 17698351197