diff --git a/.gitattributes b/.gitattributes index daec473f731fb78bd018c0deb6222035c7cee3e1..dca9c92ebecb5887bbe607ab624f89b1f096b09e 100644 --- a/.gitattributes +++ b/.gitattributes @@ -202,3 +202,27 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text 8b7178b178b/evaluation/generation/examples.8b7178b178b_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl filter=lfs diff=lfs merge=lfs -text 8b7178b178b/evaluation/generation/examples.8b7178b178b_GEM-web_nlg_en_PALM_prompt_0.jsonl filter=lfs diff=lfs merge=lfs -text 8b7178b178b/evaluation/generation/examples.8b7178b178b_GEM-web_nlg_en_PALM_prompt_2.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b13b/evaluation/generation/examples.8b7178b13b_gem_xsum_article_DOC_summary_3.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b13b/evaluation/generation/examples.8b7178b13b_gem_xsum_article_DOC_summary_4.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b13b/evaluation/generation/examples.8b7178b13b_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b13b/evaluation/generation/examples.8b7178b13b_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b13b/evaluation/generation/examples.8b7178b13b_GEM-web_nlg_en_PALM_prompt_1.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b13b/evaluation/generation/examples.8b7178b13b_GEM-web_nlg_en_PALM_prompt_4.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b13b/evaluation/generation/examples.8b7178b13b_GEM-wiki_lingua_en_tldr_en_0.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b13b/evaluation/generation/examples.8b7178b13b_gem_xsum_article_DOC_summary_1.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b13b/evaluation/generation/examples.8b7178b13b_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b13b/evaluation/generation/examples.8b7178b13b_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b13b/evaluation/generation/examples.8b7178b13b_GEM-web_nlg_en_PALM_prompt_0.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b13b/evaluation/generation/examples.8b7178b13b_GEM-web_nlg_en_PALM_prompt_2.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b13b/evaluation/generation/examples.8b7178b13b_gem_xsum_article_DOC_summary_5.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b13b/evaluation/generation/examples.8b7178b13b_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b13b/evaluation/generation/examples.8b7178b13b_GEM-web_nlg_en_PALM_prompt_5.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b13b/evaluation/generation/examples.8b7178b13b_GEM-wiki_lingua_en_tldr_en_3.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b13b/evaluation/generation/examples.8b7178b13b_GEM-wiki_lingua_en_tldr_en_4.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b13b/evaluation/generation/examples.8b7178b13b_GEM-wiki_lingua_en_tldr_en_5.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b13b/evaluation/generation/examples.8b7178b13b_gem_xsum_article_DOC_summary_0.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b13b/evaluation/generation/examples.8b7178b13b_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b13b/evaluation/generation/examples.8b7178b13b_GEM-web_nlg_en_PALM_prompt_3.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b13b/evaluation/generation/examples.8b7178b13b_GEM-wiki_lingua_en_tldr_en_1.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b13b/evaluation/generation/examples.8b7178b13b_GEM-wiki_lingua_en_tldr_en_2.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b13b/evaluation/generation/examples.8b7178b13b_gem_xsum_article_DOC_summary_2.jsonl filter=lfs diff=lfs merge=lfs -text diff --git a/8b7178b13b/evaluation/generation/agg.8b7178b13b_GEM-web_nlg_en_PALM_prompt_0.json b/8b7178b13b/evaluation/generation/agg.8b7178b13b_GEM-web_nlg_en_PALM_prompt_0.json new file mode 100644 index 0000000000000000000000000000000000000000..0d265e7f87f3b76fc8e9e47571bf81a212515f29 --- /dev/null +++ b/8b7178b13b/evaluation/generation/agg.8b7178b13b_GEM-web_nlg_en_PALM_prompt_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.4522375218061915, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.04842537846111568}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.09405156373772382, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0036589357455526954}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.2623187491640316, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0054853417994958405}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.10639641446726286, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002372783014156511}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.04001471903798784, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.002167193193860632}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.12482367655474384, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.003329638916496446}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.047608492095606206, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.001384256918874843}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.08735958257324784, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0035013157983101876}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.2450465857818092, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.005156857986010396}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.09811489729413486, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.002141247906215953}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.08882938411931994, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0035668764760974714}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.24452754279908495, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.005065510424462396}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.0992851030641096, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0022026560740801633}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b13b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b13b/evaluation/generation/agg.8b7178b13b_GEM-web_nlg_en_PALM_prompt_1.json b/8b7178b13b/evaluation/generation/agg.8b7178b13b_GEM-web_nlg_en_PALM_prompt_1.json new file mode 100644 index 0000000000000000000000000000000000000000..cf4f32cc081753ba7b759a97e8da65c4a23d78b8 --- /dev/null +++ b/8b7178b13b/evaluation/generation/agg.8b7178b13b_GEM-web_nlg_en_PALM_prompt_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.650629434960658, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.04811417898690189}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.15916782201345867, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.005131870879954661}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.29665725707782414, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.005228319001095806}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.16281032775122675, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.003905335709899557}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.07819648278455865, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0034063589997107026}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.15070155918572603, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.003623729048520002}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.08120001213349398, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0026664765201647343}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.14191196636841233, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.004635280920281775}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.2736224046058516, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004816339822450663}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.14574992383080743, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.003397730356308293}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.14648404402072937, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.004776844963861229}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.2774966849512831, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004834496186187873}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.14966591828719222, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.003504137587849123}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b13b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b13b/evaluation/generation/agg.8b7178b13b_GEM-web_nlg_en_PALM_prompt_2.json b/8b7178b13b/evaluation/generation/agg.8b7178b13b_GEM-web_nlg_en_PALM_prompt_2.json new file mode 100644 index 0000000000000000000000000000000000000000..130613391cbcb6b1893abbd12a83b766276a513a --- /dev/null +++ b/8b7178b13b/evaluation/generation/agg.8b7178b13b_GEM-web_nlg_en_PALM_prompt_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.9046528025555703, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.04317473166983863}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.21014915270499354, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.005813053226743566}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.35653672883727167, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0051494656409290275}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.2126025964717363, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.004487229116514054}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.11091162929767316, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.003989043309470051}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.18668399640135247, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0039177512048306565}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.11056055329882854, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0031590233571128605}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.1825110333764981, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.005070346564582974}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.32304322748014636, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004678142532303707}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.18634690018126043, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0038448807973693925}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.18939634311269352, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.005258445068941222}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.32966626591290826, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004724502434373412}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.19202573601368517, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.003952591052036519}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b13b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b13b/evaluation/generation/agg.8b7178b13b_GEM-web_nlg_en_PALM_prompt_3.json b/8b7178b13b/evaluation/generation/agg.8b7178b13b_GEM-web_nlg_en_PALM_prompt_3.json new file mode 100644 index 0000000000000000000000000000000000000000..3a548872a55a8a87a1759d224ed6365869c9868a --- /dev/null +++ b/8b7178b13b/evaluation/generation/agg.8b7178b13b_GEM-web_nlg_en_PALM_prompt_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 1.1442800703272336, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.05161996592570338}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.23213625362665477, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0059610834558063595}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.38062292481677, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.005078282219671234}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.23508991254207284, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.004629614568550998}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.12811335412630678, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.004200144761611546}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.20379204157806646, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.00386170912683119}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.12608234413935157, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.003256601130342381}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.1997394107463207, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.005153079376868987}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.3397942315323993, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004538527029075319}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.20320672155464048, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.003882337416765662}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.2083043346123531, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.005363455263356501}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.347929987856493, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0045764471921679985}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.21069756332821474, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.004028196190821567}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b13b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b13b/evaluation/generation/agg.8b7178b13b_GEM-web_nlg_en_PALM_prompt_4.json b/8b7178b13b/evaluation/generation/agg.8b7178b13b_GEM-web_nlg_en_PALM_prompt_4.json new file mode 100644 index 0000000000000000000000000000000000000000..7e50a9a166e37f3663b4416db6322732d36f88be --- /dev/null +++ b/8b7178b13b/evaluation/generation/agg.8b7178b13b_GEM-web_nlg_en_PALM_prompt_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 1.3793783786539846, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.08292725693632953}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.25146617993410997, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.006199020027337637}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.3925026283739189, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.005116605241451321}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.25107613979636906, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.00476323540590602}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.1385226844845104, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.004282956786141916}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.21131194271802842, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0040385627196912076}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.1354322190391961, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.003385535533668589}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.21425855000222013, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.005261027090142587}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.34988090714764264, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004590444333954342}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.2160535699510597, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.003987483818543123}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.22545655976991655, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0055589913005229}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.36010176303537716, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0046603281582664625}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.22537108240785111, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.004170782290413772}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b13b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b13b/evaluation/generation/agg.8b7178b13b_GEM-web_nlg_en_PALM_prompt_5.json b/8b7178b13b/evaluation/generation/agg.8b7178b13b_GEM-web_nlg_en_PALM_prompt_5.json new file mode 100644 index 0000000000000000000000000000000000000000..725e7bbf1687748e5aeeaa0659dc58bb136c1373 --- /dev/null +++ b/8b7178b13b/evaluation/generation/agg.8b7178b13b_GEM-web_nlg_en_PALM_prompt_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 1.4145829791141218, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.06756850302725374}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.25559388874117145, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.006265188037282814}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.4014517195417289, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0052097160639095145}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.25726246836968625, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.004880864665323261}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.1462902529413211, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.004502888503688928}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.22067604236758182, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0041554431177298085}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.1419903076188946, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.003491421839159055}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.21838534521953784, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.005386484846358847}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.35807492888309944, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004713215605602484}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.22145748379950564, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.004104691248611666}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.22909884605448813, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.00564116547513353}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.3686456415754311, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004784333349134369}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.2308946484376556, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.004281312884008834}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b13b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b13b/evaluation/generation/agg.8b7178b13b_GEM-wiki_lingua_en_tldr_en_0.json b/8b7178b13b/evaluation/generation/agg.8b7178b13b_GEM-wiki_lingua_en_tldr_en_0.json new file mode 100644 index 0000000000000000000000000000000000000000..ee5e59d69060634b9850b60582c518799f1d7864 --- /dev/null +++ b/8b7178b13b/evaluation/generation/agg.8b7178b13b_GEM-wiki_lingua_en_tldr_en_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.1631004447259747, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0025140049334374266}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.24869580468026348, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0032277820635021014}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.1810278543145764, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002359129908964426}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.0385111191751266, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0009986244610694906}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.05950986614858929, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0015515657908224004}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.04284409748743667, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.001036773633130634}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.11812150163422086, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0017909292945280444}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.18668011105548613, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002526858332113489}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.1323060407446597, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.001666744596513707}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.15149118025181801, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0023436532932745767}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.23193053314919995, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.003047509010443981}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.16822692441451978, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0021965424695315023}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 2.5768645983512664, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.10390732312462625}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b13b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b13b/evaluation/generation/agg.8b7178b13b_GEM-wiki_lingua_en_tldr_en_1.json b/8b7178b13b/evaluation/generation/agg.8b7178b13b_GEM-wiki_lingua_en_tldr_en_1.json new file mode 100644 index 0000000000000000000000000000000000000000..1b826738e60bbe8007c97afe4e5bc30b64b97bcc --- /dev/null +++ b/8b7178b13b/evaluation/generation/agg.8b7178b13b_GEM-wiki_lingua_en_tldr_en_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.24381809168774637, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0033022582237546634}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.23017687741596388, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0028624354435880044}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.20446918503496525, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0022069372036890365}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.064059693409422, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0018318331544901892}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.05717654707897076, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0015139726468610508}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.05107550928141819, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0012372719079850197}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.18545125118813593, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0026173569724847225}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.1747030421481033, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0022396644779822898}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.15417240714255895, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.001662532523275427}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.2280337645476899, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.003112015382305472}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.21469429192649783, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0026546326180329014}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.19083537889844354, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002054035558945731}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 3.2805418289148096, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.06930736886640082}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b13b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b13b/evaluation/generation/agg.8b7178b13b_e2e_nlg_cleaned_generate_text_restaurant_0.json b/8b7178b13b/evaluation/generation/agg.8b7178b13b_e2e_nlg_cleaned_generate_text_restaurant_0.json new file mode 100644 index 0000000000000000000000000000000000000000..a417e4cb75c283c027f55c05fae92a8023645089 --- /dev/null +++ b/8b7178b13b/evaluation/generation/agg.8b7178b13b_e2e_nlg_cleaned_generate_text_restaurant_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 7.518228772851459, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.07988589142118296}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.2527585937479932, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0019586691047001085}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.4532685157753863, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0036911339160002263}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.30892622395914193, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002362726614809891}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.10827294752994317, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0013193546727602984}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.21206177532278597, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0024697648114498094}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.13957033665597848, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.001587978757027655}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.2074761734719538, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0015484435087844478}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.3707049758227277, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002992917144452656}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.25201104517465034, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0018344182759923726}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.22367271169207667, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0018161195853035582}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.3994503148641263, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0034245642845668594}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.2721367746591264, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002175228967316158}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b13b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b13b/evaluation/generation/agg.8b7178b13b_e2e_nlg_cleaned_generate_text_restaurant_1.json b/8b7178b13b/evaluation/generation/agg.8b7178b13b_e2e_nlg_cleaned_generate_text_restaurant_1.json new file mode 100644 index 0000000000000000000000000000000000000000..3b34efa17ddb2db8b9e505659452285c6f956e08 --- /dev/null +++ b/8b7178b13b/evaluation/generation/agg.8b7178b13b_e2e_nlg_cleaned_generate_text_restaurant_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 11.762713013802438, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.09382576543199773}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.5758411505584643, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0032641614095776606}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.43699974124480134, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0030360517355224794}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.4698359144705449, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0023428195562317463}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.27339290904893143, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0027333405330301377}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.20425825992656632, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0021962926617281136}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.21971297989413593, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0020517231278393165}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.4200242586753886, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0030278428531837543}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.31470569352158173, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002441278894908242}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.3397129377482095, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0020808579737579473}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.4702024862705025, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0032151475190549403}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.3555458059380285, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0027838026083691135}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.3826629288347234, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0023388359390624446}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b13b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b13b/evaluation/generation/agg.8b7178b13b_e2e_nlg_cleaned_generate_text_restaurant_2.json b/8b7178b13b/evaluation/generation/agg.8b7178b13b_e2e_nlg_cleaned_generate_text_restaurant_2.json new file mode 100644 index 0000000000000000000000000000000000000000..60901e8c2bb3643d446e2598abc6e8cd17dd9abc --- /dev/null +++ b/8b7178b13b/evaluation/generation/agg.8b7178b13b_e2e_nlg_cleaned_generate_text_restaurant_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 14.028619911508963, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.17673898243267264}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.5880328986485642, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0031633644314478966}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.4720615710167169, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0030042579734499103}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.4982696315856735, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002277178664730148}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.2905416018050732, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0027458331588556565}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.2313719045642725, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002349650773654754}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.2436824998963185, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0021479952999434505}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.4304826242102334, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.002921537898047091}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.34359634632916913, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002538014950574236}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.36315580245879386, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0021103667472393136}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.4866663175226494, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.003134734940667762}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.39070560600420967, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002859660656155989}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.41230819320152157, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0023628359694983633}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b13b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b13b/evaluation/generation/agg.8b7178b13b_e2e_nlg_cleaned_generate_text_restaurant_3.json b/8b7178b13b/evaluation/generation/agg.8b7178b13b_e2e_nlg_cleaned_generate_text_restaurant_3.json new file mode 100644 index 0000000000000000000000000000000000000000..e1ddb1528abd9e5db179a874193a6b959d93ea16 --- /dev/null +++ b/8b7178b13b/evaluation/generation/agg.8b7178b13b_e2e_nlg_cleaned_generate_text_restaurant_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 14.824429124321526, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.1257638219512965}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.5903839264246126, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.003096593178519806}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.48303754455261133, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0029313776925495253}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.5070937995389966, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0021993659376666874}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.2971819596009762, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0027204840509740583}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.24110048435208156, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002348630487706421}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.2526618416523279, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0021298129637362085}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.43347382731719464, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0029257357889719074}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.3529852168172252, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002550242635255893}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.37097982222923104, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.00214061071940383}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.49123394352656125, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0031248395828196904}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.4020764458847546, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0028446825862533704}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.42203281188344766, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0023652228936698657}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b13b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b13b/evaluation/generation/agg.8b7178b13b_e2e_nlg_cleaned_generate_text_restaurant_4.json b/8b7178b13b/evaluation/generation/agg.8b7178b13b_e2e_nlg_cleaned_generate_text_restaurant_4.json new file mode 100644 index 0000000000000000000000000000000000000000..ca1f8fff95b657b84adbe5efe16fd3fbec2965b4 --- /dev/null +++ b/8b7178b13b/evaluation/generation/agg.8b7178b13b_e2e_nlg_cleaned_generate_text_restaurant_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 15.1456115809235, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.1628753687758124}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.5945998345487046, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.003074613754297493}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.48854055206810637, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0028822641580179367}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.5145793651843434, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002244489356919281}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.29784097926829245, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0026941678409656135}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.2436337287979087, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0023716503152493335}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.2559926229244319, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.002186356460577112}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.433653082379793, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.002833488672483008}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.3558030676746678, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0025159494686373797}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.3747326640922719, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.002148508706418628}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.49357503577481815, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0030663612183832903}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.4058018094790397, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002791634703514705}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.42740717670424816, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0023775373903584217}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b13b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b13b/evaluation/generation/agg.8b7178b13b_e2e_nlg_cleaned_generate_text_restaurant_5.json b/8b7178b13b/evaluation/generation/agg.8b7178b13b_e2e_nlg_cleaned_generate_text_restaurant_5.json new file mode 100644 index 0000000000000000000000000000000000000000..08dd18571632d6ecef362565a98334fa7e26281f --- /dev/null +++ b/8b7178b13b/evaluation/generation/agg.8b7178b13b_e2e_nlg_cleaned_generate_text_restaurant_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 15.184590176560544, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.17570671649096134}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.5980619294865127, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.003055147702862821}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.4899430329979205, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002838541142993511}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.5172310679190623, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002187662941341786}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.3029600136699186, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.002703515351522382}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.24620276831802643, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0023264378571411816}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.259556048619835, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.002143271876534031}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.4380103729999666, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0028424300466825983}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.35795640195755224, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0024826420662082673}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.37807698267399703, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.002126725638562394}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.4982942932710782, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0030594319184573462}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.40852131422574206, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0027745302682206834}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.4311732922825964, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0023482937755900097}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b13b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b13b/evaluation/generation/agg.8b7178b13b_gem_xsum_article_DOC_summary_0.json b/8b7178b13b/evaluation/generation/agg.8b7178b13b_gem_xsum_article_DOC_summary_0.json new file mode 100644 index 0000000000000000000000000000000000000000..de6967f0149c8eff6ca3ddab7ae0eabdda077cd3 --- /dev/null +++ b/8b7178b13b/evaluation/generation/agg.8b7178b13b_gem_xsum_article_DOC_summary_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.09160247708817207, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.002375172469912284}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.19613476599918667, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.005073318605110471}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.12067679782231505, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.003015872334492621}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.015487063309988504, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.000848981732321504}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.0363837944571209, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0020790710888273895}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.021176795907655737, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0011603757977784665}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.06937634282139736, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.001813605739492327}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.1479963053053532, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0038099944087791725}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.09086726074181874, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0022256142858678965}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.07512656050190324, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.001959507720128778}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.1612082948452722, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004219489865399336}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.09880097411831448, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0024614730448775535}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 1.0840616150366835, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.10220605780455636}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b13b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b13b/evaluation/generation/agg.8b7178b13b_gem_xsum_article_DOC_summary_1.json b/8b7178b13b/evaluation/generation/agg.8b7178b13b_gem_xsum_article_DOC_summary_1.json new file mode 100644 index 0000000000000000000000000000000000000000..799b357c289cc8f019fac55ca2ab8f6ef5a48b58 --- /dev/null +++ b/8b7178b13b/evaluation/generation/agg.8b7178b13b_gem_xsum_article_DOC_summary_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.2003179694226108, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.003646294986793581}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.3082326819925303, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004421626418186149}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.22223912621847974, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.003038126692025604}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.04617082546967428, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0021567164563758494}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.07074171325045796, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0026782882522819163}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.050641256552544464, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.002016315458850625}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.15020466828774898, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.002974138334891651}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.23037723268498672, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0034903634923284257}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.16589957489115423, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0024349153804753905}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.156190697593295, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0029737943854797597}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.2443326358730322, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.003851152935036917}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.17413975005815832, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0025334465295397523}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 2.1144830791719307, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.11445499213864452}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b13b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b13b/evaluation/generation/agg.8b7178b13b_gem_xsum_article_DOC_summary_2.json b/8b7178b13b/evaluation/generation/agg.8b7178b13b_gem_xsum_article_DOC_summary_2.json new file mode 100644 index 0000000000000000000000000000000000000000..5f35565c17ab33d0d39f0af0866b14f7c7296cef --- /dev/null +++ b/8b7178b13b/evaluation/generation/agg.8b7178b13b_gem_xsum_article_DOC_summary_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.2167785998186487, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0038703703581663036}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.29079354607238944, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0042086230091149205}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.22874247828238384, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.003191868132841587}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.05175962394844965, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.002262457698273439}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.06767519675126271, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002531468931801855}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.05359901469303583, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.002063273466751458}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.1626685190790419, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.003181540362928691}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.2176434055764335, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0033468188991687773}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.17116883513373068, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.002601631095778569}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.16752103628195428, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0031476246457933605}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.2286412427632142, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.003582394216085152}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.17781283216267912, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0026319963165001175}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 2.2306956500254795, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.1534426529740081}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b13b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b13b/evaluation/generation/examples.8b7178b13b_GEM-web_nlg_en_PALM_prompt_0.jsonl b/8b7178b13b/evaluation/generation/examples.8b7178b13b_GEM-web_nlg_en_PALM_prompt_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..d151d6f01826071d327dedbaa8d5e49ca18bdd8a --- /dev/null +++ b/8b7178b13b/evaluation/generation/examples.8b7178b13b_GEM-web_nlg_en_PALM_prompt_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d542d21b668b90881e311067f0fade41d0e99bca2b1a03e3c2cb650caf2e3a9 +size 3701606 diff --git a/8b7178b13b/evaluation/generation/examples.8b7178b13b_GEM-web_nlg_en_PALM_prompt_1.jsonl b/8b7178b13b/evaluation/generation/examples.8b7178b13b_GEM-web_nlg_en_PALM_prompt_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..0bdba2c6c90663daeab5d391c6ee97f6c037c2ba --- /dev/null +++ b/8b7178b13b/evaluation/generation/examples.8b7178b13b_GEM-web_nlg_en_PALM_prompt_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0dc929128d4969c62cc80aa03e4ec9df506381a503f1006e0086447d9053f708 +size 4526953 diff --git a/8b7178b13b/evaluation/generation/examples.8b7178b13b_GEM-web_nlg_en_PALM_prompt_2.jsonl b/8b7178b13b/evaluation/generation/examples.8b7178b13b_GEM-web_nlg_en_PALM_prompt_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..8ada71423a9e23b742f35ce7f3d0ade7f435edd9 --- /dev/null +++ b/8b7178b13b/evaluation/generation/examples.8b7178b13b_GEM-web_nlg_en_PALM_prompt_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b7ae3dc212bd1cc2a21aaa72a4fcdc008cf8f49b3e39e0007f179f9d0a03314b +size 5434253 diff --git a/8b7178b13b/evaluation/generation/examples.8b7178b13b_GEM-web_nlg_en_PALM_prompt_3.jsonl b/8b7178b13b/evaluation/generation/examples.8b7178b13b_GEM-web_nlg_en_PALM_prompt_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..5c66cf2144a963b0f45b88709de0f68cc5219aac --- /dev/null +++ b/8b7178b13b/evaluation/generation/examples.8b7178b13b_GEM-web_nlg_en_PALM_prompt_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a703d0527c4db4dd0a2ee76bbaf675ee0ffa35d5e4dc1c712221531be43e3a53 +size 6314762 diff --git a/8b7178b13b/evaluation/generation/examples.8b7178b13b_GEM-web_nlg_en_PALM_prompt_4.jsonl b/8b7178b13b/evaluation/generation/examples.8b7178b13b_GEM-web_nlg_en_PALM_prompt_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..7e0ee6d60db72335f713f146c00b17b52b6049e3 --- /dev/null +++ b/8b7178b13b/evaluation/generation/examples.8b7178b13b_GEM-web_nlg_en_PALM_prompt_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa4773eaeafa4fcdfe6d345ccec98af9fd38bf4308ea8642891ff153a07b56d7 +size 7186302 diff --git a/8b7178b13b/evaluation/generation/examples.8b7178b13b_GEM-web_nlg_en_PALM_prompt_5.jsonl b/8b7178b13b/evaluation/generation/examples.8b7178b13b_GEM-web_nlg_en_PALM_prompt_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..875cbc2840dc3ad2e10fdbac446ad8610a194b43 --- /dev/null +++ b/8b7178b13b/evaluation/generation/examples.8b7178b13b_GEM-web_nlg_en_PALM_prompt_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:818fcd13b019479e560b487cdbaba518378c3924c027fcdd9f3a7d4a20cabd7e +size 8081832 diff --git a/8b7178b13b/evaluation/generation/examples.8b7178b13b_GEM-wiki_lingua_en_tldr_en_0.jsonl b/8b7178b13b/evaluation/generation/examples.8b7178b13b_GEM-wiki_lingua_en_tldr_en_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..19b645b884b0f56ff0a6f6d59c82aad1af255c11 --- /dev/null +++ b/8b7178b13b/evaluation/generation/examples.8b7178b13b_GEM-wiki_lingua_en_tldr_en_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58099176c35cec88e022d1c22e780678de0d16fae2edcc092463f9dba2724c07 +size 7555156 diff --git a/8b7178b13b/evaluation/generation/examples.8b7178b13b_GEM-wiki_lingua_en_tldr_en_1.jsonl b/8b7178b13b/evaluation/generation/examples.8b7178b13b_GEM-wiki_lingua_en_tldr_en_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..f3d427b5d3374d8e05448cd5786800f34dc6059e --- /dev/null +++ b/8b7178b13b/evaluation/generation/examples.8b7178b13b_GEM-wiki_lingua_en_tldr_en_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:88c4678e45a42a488fc9db3f10447346c793ef85d4e1939c5be0c367388bb2dc +size 13021146 diff --git a/8b7178b13b/evaluation/generation/examples.8b7178b13b_GEM-wiki_lingua_en_tldr_en_2.jsonl b/8b7178b13b/evaluation/generation/examples.8b7178b13b_GEM-wiki_lingua_en_tldr_en_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/8b7178b13b/evaluation/generation/examples.8b7178b13b_GEM-wiki_lingua_en_tldr_en_3.jsonl b/8b7178b13b/evaluation/generation/examples.8b7178b13b_GEM-wiki_lingua_en_tldr_en_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/8b7178b13b/evaluation/generation/examples.8b7178b13b_GEM-wiki_lingua_en_tldr_en_4.jsonl b/8b7178b13b/evaluation/generation/examples.8b7178b13b_GEM-wiki_lingua_en_tldr_en_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/8b7178b13b/evaluation/generation/examples.8b7178b13b_GEM-wiki_lingua_en_tldr_en_5.jsonl b/8b7178b13b/evaluation/generation/examples.8b7178b13b_GEM-wiki_lingua_en_tldr_en_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/8b7178b13b/evaluation/generation/examples.8b7178b13b_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl b/8b7178b13b/evaluation/generation/examples.8b7178b13b_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..70fcaf0833ae870d232f7de60bc7c7e0da59a959 --- /dev/null +++ b/8b7178b13b/evaluation/generation/examples.8b7178b13b_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1187569a4616b479e1fc5aa9508a9017d2491b0a08161191611361dbb4aacade +size 4352329 diff --git a/8b7178b13b/evaluation/generation/examples.8b7178b13b_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl b/8b7178b13b/evaluation/generation/examples.8b7178b13b_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..4bf97c07c8deb8b122011d79506177fa3fbc8a66 --- /dev/null +++ b/8b7178b13b/evaluation/generation/examples.8b7178b13b_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fbed82d3acacfded166d7c820cd1baa44fbdd050ce64e0bc596e807d7d6a066e +size 5001088 diff --git a/8b7178b13b/evaluation/generation/examples.8b7178b13b_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl b/8b7178b13b/evaluation/generation/examples.8b7178b13b_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..3435ab3968ebefb953c44d241d445ab2684485b4 --- /dev/null +++ b/8b7178b13b/evaluation/generation/examples.8b7178b13b_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:09bacf7baa4961897e5e6928d3a0eb615cf2b0b2a00d6e700aa25e5c1866b586 +size 6099667 diff --git a/8b7178b13b/evaluation/generation/examples.8b7178b13b_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl b/8b7178b13b/evaluation/generation/examples.8b7178b13b_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..30bc1565ab0d8e9d98288ac9c472a137de257fe8 --- /dev/null +++ b/8b7178b13b/evaluation/generation/examples.8b7178b13b_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:975ddd44be0ce72a28793a5ad928128dd6abcf0488281dc3941fe4e919a1c634 +size 7187617 diff --git a/8b7178b13b/evaluation/generation/examples.8b7178b13b_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl b/8b7178b13b/evaluation/generation/examples.8b7178b13b_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..9f252a8fbef2b6d3fefb3d7e5de3c22541cebaf1 --- /dev/null +++ b/8b7178b13b/evaluation/generation/examples.8b7178b13b_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ab3596ed9a527667b7dd1747b6963e5d6c2941f57297b1e0055fae3e0d00744 +size 8265755 diff --git a/8b7178b13b/evaluation/generation/examples.8b7178b13b_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl b/8b7178b13b/evaluation/generation/examples.8b7178b13b_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..8ee6967326d80d914375aca27e1c26837e674e31 --- /dev/null +++ b/8b7178b13b/evaluation/generation/examples.8b7178b13b_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac87d882575b5b56a379585db094a803629b1b8dc79521bc808a0580c596a29c +size 9352129 diff --git a/8b7178b13b/evaluation/generation/examples.8b7178b13b_gem_xsum_article_DOC_summary_0.jsonl b/8b7178b13b/evaluation/generation/examples.8b7178b13b_gem_xsum_article_DOC_summary_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..030a12e63fac763f893bbb0e66754c10f6a7505e --- /dev/null +++ b/8b7178b13b/evaluation/generation/examples.8b7178b13b_gem_xsum_article_DOC_summary_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:11cbdf838c18198a69f1c12dd2cfc72b4762d016842811220c56735a31ed1ba8 +size 2744975 diff --git a/8b7178b13b/evaluation/generation/examples.8b7178b13b_gem_xsum_article_DOC_summary_1.jsonl b/8b7178b13b/evaluation/generation/examples.8b7178b13b_gem_xsum_article_DOC_summary_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..2b0cf3da2577a37b1b4f29e91c0609f20737ffef --- /dev/null +++ b/8b7178b13b/evaluation/generation/examples.8b7178b13b_gem_xsum_article_DOC_summary_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6fdf0e52e4bd35d09eb117e6f3bec08387f01d5fcebdb6962f57f2f4e803ac2c +size 5011713 diff --git a/8b7178b13b/evaluation/generation/examples.8b7178b13b_gem_xsum_article_DOC_summary_2.jsonl b/8b7178b13b/evaluation/generation/examples.8b7178b13b_gem_xsum_article_DOC_summary_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..dbf2cbc115ab33c48fae05ecd10c39a8f8b59707 --- /dev/null +++ b/8b7178b13b/evaluation/generation/examples.8b7178b13b_gem_xsum_article_DOC_summary_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee6974f94f3c6e92f55c1438fffbd467adecef14ccf6487fb827b2905fedfabd +size 7255905 diff --git a/8b7178b13b/evaluation/generation/examples.8b7178b13b_gem_xsum_article_DOC_summary_3.jsonl b/8b7178b13b/evaluation/generation/examples.8b7178b13b_gem_xsum_article_DOC_summary_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/8b7178b13b/evaluation/generation/examples.8b7178b13b_gem_xsum_article_DOC_summary_4.jsonl b/8b7178b13b/evaluation/generation/examples.8b7178b13b_gem_xsum_article_DOC_summary_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/8b7178b13b/evaluation/generation/examples.8b7178b13b_gem_xsum_article_DOC_summary_5.jsonl b/8b7178b13b/evaluation/generation/examples.8b7178b13b_gem_xsum_article_DOC_summary_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/8b7178b13b/evaluation/generation/slim.8b7178b13b_GEM-web_nlg_en_PALM_prompt_0.json b/8b7178b13b/evaluation/generation/slim.8b7178b13b_GEM-web_nlg_en_PALM_prompt_0.json new file mode 100644 index 0000000000000000000000000000000000000000..89781ea415a8fe60336ac43544eb0a8c2b9335ef --- /dev/null +++ b/8b7178b13b/evaluation/generation/slim.8b7178b13b_GEM-web_nlg_en_PALM_prompt_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.4522375218061915, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.04842537846111568 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.09405156373772382, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0036589357455526954 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.2623187491640316, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0054853417994958405 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.10639641446726286, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.002372783014156511 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.04001471903798784, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.002167193193860632 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.12482367655474384, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.003329638916496446 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.047608492095606206, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.001384256918874843 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.08735958257324784, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0035013157983101876 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.2450465857818092, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.005156857986010396 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.09811489729413486, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.002141247906215953 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.08882938411931994, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0035668764760974714 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.24452754279908495, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.005065510424462396 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.0992851030641096, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0022026560740801633 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b13b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b13b/evaluation/generation/slim.8b7178b13b_GEM-web_nlg_en_PALM_prompt_1.json b/8b7178b13b/evaluation/generation/slim.8b7178b13b_GEM-web_nlg_en_PALM_prompt_1.json new file mode 100644 index 0000000000000000000000000000000000000000..480d0e035395c7b503c67b39947f613039b6416d --- /dev/null +++ b/8b7178b13b/evaluation/generation/slim.8b7178b13b_GEM-web_nlg_en_PALM_prompt_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.650629434960658, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.04811417898690189 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.15916782201345867, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.005131870879954661 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.29665725707782414, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.005228319001095806 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.16281032775122675, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.003905335709899557 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.07819648278455865, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0034063589997107026 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.15070155918572603, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.003623729048520002 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.08120001213349398, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0026664765201647343 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.14191196636841233, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.004635280920281775 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.2736224046058516, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004816339822450663 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.14574992383080743, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.003397730356308293 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.14648404402072937, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.004776844963861229 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.2774966849512831, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004834496186187873 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.14966591828719222, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.003504137587849123 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b13b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b13b/evaluation/generation/slim.8b7178b13b_GEM-web_nlg_en_PALM_prompt_2.json b/8b7178b13b/evaluation/generation/slim.8b7178b13b_GEM-web_nlg_en_PALM_prompt_2.json new file mode 100644 index 0000000000000000000000000000000000000000..98b175bb2cef37b9babecd3363fd764128e627fc --- /dev/null +++ b/8b7178b13b/evaluation/generation/slim.8b7178b13b_GEM-web_nlg_en_PALM_prompt_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.9046528025555703, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.04317473166983863 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.21014915270499354, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.005813053226743566 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.35653672883727167, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0051494656409290275 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.2126025964717363, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.004487229116514054 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.11091162929767316, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.003989043309470051 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.18668399640135247, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0039177512048306565 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.11056055329882854, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0031590233571128605 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.1825110333764981, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.005070346564582974 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.32304322748014636, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004678142532303707 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.18634690018126043, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0038448807973693925 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.18939634311269352, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.005258445068941222 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.32966626591290826, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004724502434373412 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.19202573601368517, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.003952591052036519 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b13b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b13b/evaluation/generation/slim.8b7178b13b_GEM-web_nlg_en_PALM_prompt_3.json b/8b7178b13b/evaluation/generation/slim.8b7178b13b_GEM-web_nlg_en_PALM_prompt_3.json new file mode 100644 index 0000000000000000000000000000000000000000..ded309b30005d37774e6598bcadb81a26fc20a12 --- /dev/null +++ b/8b7178b13b/evaluation/generation/slim.8b7178b13b_GEM-web_nlg_en_PALM_prompt_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 1.1442800703272336, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.05161996592570338 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.23213625362665477, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0059610834558063595 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.38062292481677, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.005078282219671234 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.23508991254207284, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.004629614568550998 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.12811335412630678, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.004200144761611546 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.20379204157806646, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.00386170912683119 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.12608234413935157, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.003256601130342381 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.1997394107463207, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.005153079376868987 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.3397942315323993, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004538527029075319 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.20320672155464048, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.003882337416765662 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.2083043346123531, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.005363455263356501 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.347929987856493, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0045764471921679985 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.21069756332821474, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.004028196190821567 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b13b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b13b/evaluation/generation/slim.8b7178b13b_GEM-web_nlg_en_PALM_prompt_4.json b/8b7178b13b/evaluation/generation/slim.8b7178b13b_GEM-web_nlg_en_PALM_prompt_4.json new file mode 100644 index 0000000000000000000000000000000000000000..1269947398cd7ef991606ab0ee2e1cb0df430a1b --- /dev/null +++ b/8b7178b13b/evaluation/generation/slim.8b7178b13b_GEM-web_nlg_en_PALM_prompt_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 1.3793783786539846, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.08292725693632953 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.25146617993410997, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.006199020027337637 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.3925026283739189, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.005116605241451321 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.25107613979636906, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.00476323540590602 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.1385226844845104, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.004282956786141916 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.21131194271802842, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0040385627196912076 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.1354322190391961, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.003385535533668589 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.21425855000222013, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.005261027090142587 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.34988090714764264, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004590444333954342 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.2160535699510597, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.003987483818543123 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.22545655976991655, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0055589913005229 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.36010176303537716, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0046603281582664625 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.22537108240785111, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.004170782290413772 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b13b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b13b/evaluation/generation/slim.8b7178b13b_GEM-web_nlg_en_PALM_prompt_5.json b/8b7178b13b/evaluation/generation/slim.8b7178b13b_GEM-web_nlg_en_PALM_prompt_5.json new file mode 100644 index 0000000000000000000000000000000000000000..ac8f207cee93ab42353a1763d32e1e258b63cfcb --- /dev/null +++ b/8b7178b13b/evaluation/generation/slim.8b7178b13b_GEM-web_nlg_en_PALM_prompt_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 1.4145829791141218, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.06756850302725374 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.25559388874117145, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.006265188037282814 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.4014517195417289, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0052097160639095145 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.25726246836968625, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.004880864665323261 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.1462902529413211, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.004502888503688928 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.22067604236758182, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0041554431177298085 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.1419903076188946, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.003491421839159055 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.21838534521953784, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.005386484846358847 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.35807492888309944, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004713215605602484 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.22145748379950564, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.004104691248611666 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.22909884605448813, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.00564116547513353 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.3686456415754311, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004784333349134369 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.2308946484376556, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.004281312884008834 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b13b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b13b/evaluation/generation/slim.8b7178b13b_GEM-wiki_lingua_en_tldr_en_0.json b/8b7178b13b/evaluation/generation/slim.8b7178b13b_GEM-wiki_lingua_en_tldr_en_0.json new file mode 100644 index 0000000000000000000000000000000000000000..76c30d6ca650ff06b552f0f2b98b961ba261bdaa --- /dev/null +++ b/8b7178b13b/evaluation/generation/slim.8b7178b13b_GEM-wiki_lingua_en_tldr_en_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.1631004447259747, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0025140049334374266 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.24869580468026348, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0032277820635021014 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.1810278543145764, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.002359129908964426 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.0385111191751266, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0009986244610694906 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.05950986614858929, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0015515657908224004 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.04284409748743667, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.001036773633130634 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.11812150163422086, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0017909292945280444 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.18668011105548613, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.002526858332113489 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.1323060407446597, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.001666744596513707 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.15149118025181801, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0023436532932745767 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.23193053314919995, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.003047509010443981 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.16822692441451978, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0021965424695315023 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 2.5768645983512664, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.10390732312462625 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b13b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b13b/evaluation/generation/slim.8b7178b13b_GEM-wiki_lingua_en_tldr_en_1.json b/8b7178b13b/evaluation/generation/slim.8b7178b13b_GEM-wiki_lingua_en_tldr_en_1.json new file mode 100644 index 0000000000000000000000000000000000000000..21aa2e170c51a08648129163e28da97250ba6b0c --- /dev/null +++ b/8b7178b13b/evaluation/generation/slim.8b7178b13b_GEM-wiki_lingua_en_tldr_en_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.24381809168774637, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0033022582237546634 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.23017687741596388, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0028624354435880044 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.20446918503496525, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0022069372036890365 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.064059693409422, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0018318331544901892 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.05717654707897076, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0015139726468610508 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.05107550928141819, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0012372719079850197 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.18545125118813593, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0026173569724847225 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.1747030421481033, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0022396644779822898 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.15417240714255895, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.001662532523275427 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.2280337645476899, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.003112015382305472 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.21469429192649783, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0026546326180329014 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.19083537889844354, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.002054035558945731 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 3.2805418289148096, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.06930736886640082 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b13b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b13b/evaluation/generation/slim.8b7178b13b_e2e_nlg_cleaned_generate_text_restaurant_0.json b/8b7178b13b/evaluation/generation/slim.8b7178b13b_e2e_nlg_cleaned_generate_text_restaurant_0.json new file mode 100644 index 0000000000000000000000000000000000000000..d64a87eb8f8c05684e1c46f917b56ea5f33fd12a --- /dev/null +++ b/8b7178b13b/evaluation/generation/slim.8b7178b13b_e2e_nlg_cleaned_generate_text_restaurant_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 7.518228772851459, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.07988589142118296 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.2527585937479932, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0019586691047001085 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.4532685157753863, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0036911339160002263 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.30892622395914193, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.002362726614809891 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.10827294752994317, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0013193546727602984 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.21206177532278597, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0024697648114498094 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.13957033665597848, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.001587978757027655 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.2074761734719538, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0015484435087844478 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.3707049758227277, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.002992917144452656 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.25201104517465034, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0018344182759923726 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.22367271169207667, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0018161195853035582 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.3994503148641263, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0034245642845668594 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.2721367746591264, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.002175228967316158 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b13b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b13b/evaluation/generation/slim.8b7178b13b_e2e_nlg_cleaned_generate_text_restaurant_1.json b/8b7178b13b/evaluation/generation/slim.8b7178b13b_e2e_nlg_cleaned_generate_text_restaurant_1.json new file mode 100644 index 0000000000000000000000000000000000000000..a8dd8b909340548d566d4816de4f4e659d22f0d9 --- /dev/null +++ b/8b7178b13b/evaluation/generation/slim.8b7178b13b_e2e_nlg_cleaned_generate_text_restaurant_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 11.762713013802438, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.09382576543199773 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.5758411505584643, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0032641614095776606 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.43699974124480134, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0030360517355224794 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.4698359144705449, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0023428195562317463 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.27339290904893143, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0027333405330301377 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.20425825992656632, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0021962926617281136 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.21971297989413593, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0020517231278393165 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.4200242586753886, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0030278428531837543 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.31470569352158173, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.002441278894908242 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.3397129377482095, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0020808579737579473 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.4702024862705025, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0032151475190549403 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.3555458059380285, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0027838026083691135 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.3826629288347234, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0023388359390624446 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b13b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b13b/evaluation/generation/slim.8b7178b13b_e2e_nlg_cleaned_generate_text_restaurant_2.json b/8b7178b13b/evaluation/generation/slim.8b7178b13b_e2e_nlg_cleaned_generate_text_restaurant_2.json new file mode 100644 index 0000000000000000000000000000000000000000..5cedb803f7a23200f0dd9299c0556eb3a89657b0 --- /dev/null +++ b/8b7178b13b/evaluation/generation/slim.8b7178b13b_e2e_nlg_cleaned_generate_text_restaurant_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 14.028619911508963, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.17673898243267264 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.5880328986485642, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0031633644314478966 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.4720615710167169, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0030042579734499103 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.4982696315856735, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.002277178664730148 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.2905416018050732, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0027458331588556565 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.2313719045642725, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.002349650773654754 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.2436824998963185, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0021479952999434505 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.4304826242102334, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.002921537898047091 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.34359634632916913, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.002538014950574236 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.36315580245879386, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0021103667472393136 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.4866663175226494, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.003134734940667762 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.39070560600420967, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.002859660656155989 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.41230819320152157, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0023628359694983633 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b13b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b13b/evaluation/generation/slim.8b7178b13b_e2e_nlg_cleaned_generate_text_restaurant_3.json b/8b7178b13b/evaluation/generation/slim.8b7178b13b_e2e_nlg_cleaned_generate_text_restaurant_3.json new file mode 100644 index 0000000000000000000000000000000000000000..2599128a5371ba714341e1bbd42f62b8720e158e --- /dev/null +++ b/8b7178b13b/evaluation/generation/slim.8b7178b13b_e2e_nlg_cleaned_generate_text_restaurant_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 14.824429124321526, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.1257638219512965 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.5903839264246126, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.003096593178519806 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.48303754455261133, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0029313776925495253 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.5070937995389966, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0021993659376666874 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.2971819596009762, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0027204840509740583 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.24110048435208156, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.002348630487706421 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.2526618416523279, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0021298129637362085 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.43347382731719464, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0029257357889719074 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.3529852168172252, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.002550242635255893 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.37097982222923104, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.00214061071940383 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.49123394352656125, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0031248395828196904 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.4020764458847546, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0028446825862533704 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.42203281188344766, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0023652228936698657 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b13b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b13b/evaluation/generation/slim.8b7178b13b_e2e_nlg_cleaned_generate_text_restaurant_4.json b/8b7178b13b/evaluation/generation/slim.8b7178b13b_e2e_nlg_cleaned_generate_text_restaurant_4.json new file mode 100644 index 0000000000000000000000000000000000000000..45853c75d240e024359b545055c00388b058b14d --- /dev/null +++ b/8b7178b13b/evaluation/generation/slim.8b7178b13b_e2e_nlg_cleaned_generate_text_restaurant_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 15.1456115809235, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.1628753687758124 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.5945998345487046, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.003074613754297493 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.48854055206810637, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0028822641580179367 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.5145793651843434, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.002244489356919281 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.29784097926829245, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0026941678409656135 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.2436337287979087, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0023716503152493335 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.2559926229244319, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.002186356460577112 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.433653082379793, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.002833488672483008 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.3558030676746678, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0025159494686373797 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.3747326640922719, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.002148508706418628 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.49357503577481815, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0030663612183832903 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.4058018094790397, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.002791634703514705 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.42740717670424816, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0023775373903584217 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b13b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b13b/evaluation/generation/slim.8b7178b13b_e2e_nlg_cleaned_generate_text_restaurant_5.json b/8b7178b13b/evaluation/generation/slim.8b7178b13b_e2e_nlg_cleaned_generate_text_restaurant_5.json new file mode 100644 index 0000000000000000000000000000000000000000..ca14136848019558a7caaa5a3f5b5e111f2979d1 --- /dev/null +++ b/8b7178b13b/evaluation/generation/slim.8b7178b13b_e2e_nlg_cleaned_generate_text_restaurant_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 15.184590176560544, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.17570671649096134 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.5980619294865127, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.003055147702862821 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.4899430329979205, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.002838541142993511 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.5172310679190623, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.002187662941341786 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.3029600136699186, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.002703515351522382 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.24620276831802643, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0023264378571411816 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.259556048619835, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.002143271876534031 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.4380103729999666, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0028424300466825983 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.35795640195755224, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0024826420662082673 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.37807698267399703, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.002126725638562394 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.4982942932710782, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0030594319184573462 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.40852131422574206, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0027745302682206834 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.4311732922825964, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0023482937755900097 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b13b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b13b/evaluation/generation/slim.8b7178b13b_gem_xsum_article_DOC_summary_0.json b/8b7178b13b/evaluation/generation/slim.8b7178b13b_gem_xsum_article_DOC_summary_0.json new file mode 100644 index 0000000000000000000000000000000000000000..8b61a011b1173bbe3c0861c6abbc38d7193a6032 --- /dev/null +++ b/8b7178b13b/evaluation/generation/slim.8b7178b13b_gem_xsum_article_DOC_summary_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.09160247708817207, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.002375172469912284 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.19613476599918667, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.005073318605110471 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.12067679782231505, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.003015872334492621 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.015487063309988504, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.000848981732321504 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.0363837944571209, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0020790710888273895 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.021176795907655737, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0011603757977784665 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.06937634282139736, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.001813605739492327 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.1479963053053532, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0038099944087791725 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.09086726074181874, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0022256142858678965 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.07512656050190324, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.001959507720128778 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.1612082948452722, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.004219489865399336 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.09880097411831448, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0024614730448775535 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 1.0840616150366835, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.10220605780455636 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b13b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b13b/evaluation/generation/slim.8b7178b13b_gem_xsum_article_DOC_summary_1.json b/8b7178b13b/evaluation/generation/slim.8b7178b13b_gem_xsum_article_DOC_summary_1.json new file mode 100644 index 0000000000000000000000000000000000000000..2c40ba1bd69a5930770dc68b778cd22d17d81c71 --- /dev/null +++ b/8b7178b13b/evaluation/generation/slim.8b7178b13b_gem_xsum_article_DOC_summary_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.2003179694226108, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.003646294986793581 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.3082326819925303, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.004421626418186149 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.22223912621847974, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.003038126692025604 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.04617082546967428, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0021567164563758494 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.07074171325045796, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0026782882522819163 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.050641256552544464, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.002016315458850625 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.15020466828774898, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.002974138334891651 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.23037723268498672, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0034903634923284257 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.16589957489115423, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0024349153804753905 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.156190697593295, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0029737943854797597 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.2443326358730322, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.003851152935036917 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.17413975005815832, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0025334465295397523 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 2.1144830791719307, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.11445499213864452 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b13b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b13b/evaluation/generation/slim.8b7178b13b_gem_xsum_article_DOC_summary_2.json b/8b7178b13b/evaluation/generation/slim.8b7178b13b_gem_xsum_article_DOC_summary_2.json new file mode 100644 index 0000000000000000000000000000000000000000..6786e47892c76ae64abd3c238da34f82e3639678 --- /dev/null +++ b/8b7178b13b/evaluation/generation/slim.8b7178b13b_gem_xsum_article_DOC_summary_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.2167785998186487, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0038703703581663036 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.29079354607238944, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.0042086230091149205 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.22874247828238384, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.003191868132841587 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.05175962394844965, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.002262457698273439 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.06767519675126271, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.002531468931801855 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.05359901469303583, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.002063273466751458 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.1626685190790419, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.003181540362928691 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.2176434055764335, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0033468188991687773 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.17116883513373068, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.002601631095778569 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.16752103628195428, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0031476246457933605 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.2286412427632142, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.003582394216085152 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.17781283216267912, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0026319963165001175 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 2.2306956500254795, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.1534426529740081 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b13b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b13b/evaluation/rankeval/8b7178b13b_0.json b/8b7178b13b/evaluation/rankeval/8b7178b13b_0.json new file mode 100644 index 0000000000000000000000000000000000000000..8ce17533780c8f358c9be167337acd8af6dbb1a0 --- /dev/null +++ b/8b7178b13b/evaluation/rankeval/8b7178b13b_0.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.354, + "acc_stderr": 0.015129868238451773 + }, + "anli_r2": { + "acc": 0.331, + "acc_stderr": 0.01488827258820394 + }, + "anli_r3": { + "acc": 0.3458333333333333, + "acc_stderr": 0.01373624534231101 + }, + "cb": { + "acc": 0.2857142857142857, + "acc_stderr": 0.06091449038731724, + "f1": 0.30952380952380953 + }, + "copa": { + "acc": 0.7, + "acc_stderr": 0.046056618647183814 + }, + "hellaswag": { + "acc": 0.4360685122485561, + "acc_stderr": 0.004948824501355485, + "acc_norm": 0.5632344154550887, + "acc_norm_stderr": 0.004949716368890496 + }, + "rte": { + "acc": 0.5306859205776173, + "acc_stderr": 0.03003973059219781 + }, + "winogrande": { + "acc": 0.5666929755327546, + "acc_stderr": 0.013926915052757347 + }, + "storycloze_2016": { + "acc": 0.6969535008017104, + "acc_stderr": 0.010627613073376715 + }, + "boolq": { + "acc": 0.5501529051987768, + "acc_stderr": 0.008700950643028801 + }, + "arc_easy": { + "acc": 0.5707070707070707, + "acc_stderr": 0.010156678075911087, + "acc_norm": 0.5172558922558923, + "acc_norm_stderr": 0.010253671674754631 + }, + "arc_challenge": { + "acc": 0.2721843003412969, + "acc_stderr": 0.013006600406423707, + "acc_norm": 0.2832764505119454, + "acc_norm_stderr": 0.013167478735134575 + }, + "sciq": { + "acc": 0.848, + "acc_stderr": 0.011358918303475282, + "acc_norm": 0.758, + "acc_norm_stderr": 0.013550631705555958 + }, + "piqa": { + "acc": 0.7225244831338411, + "acc_stderr": 0.010446818281039959, + "acc_norm": 0.7317736670293797, + "acc_norm_stderr": 0.010336761992404485 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/8b7178b13b/evaluation/rankeval/8b7178b13b_0_lm-eval_global_step84877_2023-05-15-10-06-37_0shots_backup.json b/8b7178b13b/evaluation/rankeval/8b7178b13b_0_lm-eval_global_step84877_2023-05-15-10-06-37_0shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..8ce17533780c8f358c9be167337acd8af6dbb1a0 --- /dev/null +++ b/8b7178b13b/evaluation/rankeval/8b7178b13b_0_lm-eval_global_step84877_2023-05-15-10-06-37_0shots_backup.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.354, + "acc_stderr": 0.015129868238451773 + }, + "anli_r2": { + "acc": 0.331, + "acc_stderr": 0.01488827258820394 + }, + "anli_r3": { + "acc": 0.3458333333333333, + "acc_stderr": 0.01373624534231101 + }, + "cb": { + "acc": 0.2857142857142857, + "acc_stderr": 0.06091449038731724, + "f1": 0.30952380952380953 + }, + "copa": { + "acc": 0.7, + "acc_stderr": 0.046056618647183814 + }, + "hellaswag": { + "acc": 0.4360685122485561, + "acc_stderr": 0.004948824501355485, + "acc_norm": 0.5632344154550887, + "acc_norm_stderr": 0.004949716368890496 + }, + "rte": { + "acc": 0.5306859205776173, + "acc_stderr": 0.03003973059219781 + }, + "winogrande": { + "acc": 0.5666929755327546, + "acc_stderr": 0.013926915052757347 + }, + "storycloze_2016": { + "acc": 0.6969535008017104, + "acc_stderr": 0.010627613073376715 + }, + "boolq": { + "acc": 0.5501529051987768, + "acc_stderr": 0.008700950643028801 + }, + "arc_easy": { + "acc": 0.5707070707070707, + "acc_stderr": 0.010156678075911087, + "acc_norm": 0.5172558922558923, + "acc_norm_stderr": 0.010253671674754631 + }, + "arc_challenge": { + "acc": 0.2721843003412969, + "acc_stderr": 0.013006600406423707, + "acc_norm": 0.2832764505119454, + "acc_norm_stderr": 0.013167478735134575 + }, + "sciq": { + "acc": 0.848, + "acc_stderr": 0.011358918303475282, + "acc_norm": 0.758, + "acc_norm_stderr": 0.013550631705555958 + }, + "piqa": { + "acc": 0.7225244831338411, + "acc_stderr": 0.010446818281039959, + "acc_norm": 0.7317736670293797, + "acc_norm_stderr": 0.010336761992404485 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/8b7178b13b/evaluation/rankeval/8b7178b13b_1.json b/8b7178b13b/evaluation/rankeval/8b7178b13b_1.json new file mode 100644 index 0000000000000000000000000000000000000000..7c5e0809944d832c5cf497fea1ecdc9b4c0a1da1 --- /dev/null +++ b/8b7178b13b/evaluation/rankeval/8b7178b13b_1.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.34, + "acc_stderr": 0.014987482264363937 + }, + "anli_r2": { + "acc": 0.326, + "acc_stderr": 0.014830507204541028 + }, + "anli_r3": { + "acc": 0.3541666666666667, + "acc_stderr": 0.01381193349957096 + }, + "cb": { + "acc": 0.42857142857142855, + "acc_stderr": 0.06672848092813058, + "f1": 0.36324786324786323 + }, + "copa": { + "acc": 0.75, + "acc_stderr": 0.04351941398892446 + }, + "hellaswag": { + "acc": 0.4411471818362876, + "acc_stderr": 0.004955095096264714, + "acc_norm": 0.5774746066520613, + "acc_norm_stderr": 0.004929517011508216 + }, + "rte": { + "acc": 0.5234657039711191, + "acc_stderr": 0.030063300411902652 + }, + "winogrande": { + "acc": 0.5595895816890292, + "acc_stderr": 0.013952330311915603 + }, + "storycloze_2016": { + "acc": 0.6830571886691609, + "acc_stderr": 0.010759650951452121 + }, + "boolq": { + "acc": 0.5562691131498471, + "acc_stderr": 0.008689501105367413 + }, + "arc_easy": { + "acc": 0.5968013468013468, + "acc_stderr": 0.010065668576794803, + "acc_norm": 0.5913299663299664, + "acc_norm_stderr": 0.01008717449876288 + }, + "arc_challenge": { + "acc": 0.27474402730375425, + "acc_stderr": 0.013044617212771227, + "acc_norm": 0.3037542662116041, + "acc_norm_stderr": 0.01343890918477876 + }, + "sciq": { + "acc": 0.887, + "acc_stderr": 0.010016552866696846, + "acc_norm": 0.882, + "acc_norm_stderr": 0.01020686926438179 + }, + "piqa": { + "acc": 0.7295973884657236, + "acc_stderr": 0.010363167031620784, + "acc_norm": 0.7334058759521219, + "acc_norm_stderr": 0.010316749863541365 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/8b7178b13b/evaluation/rankeval/8b7178b13b_1_lm-eval_global_step84877_2023-05-15-10-06-37_1shots_backup.json b/8b7178b13b/evaluation/rankeval/8b7178b13b_1_lm-eval_global_step84877_2023-05-15-10-06-37_1shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..7c5e0809944d832c5cf497fea1ecdc9b4c0a1da1 --- /dev/null +++ b/8b7178b13b/evaluation/rankeval/8b7178b13b_1_lm-eval_global_step84877_2023-05-15-10-06-37_1shots_backup.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.34, + "acc_stderr": 0.014987482264363937 + }, + "anli_r2": { + "acc": 0.326, + "acc_stderr": 0.014830507204541028 + }, + "anli_r3": { + "acc": 0.3541666666666667, + "acc_stderr": 0.01381193349957096 + }, + "cb": { + "acc": 0.42857142857142855, + "acc_stderr": 0.06672848092813058, + "f1": 0.36324786324786323 + }, + "copa": { + "acc": 0.75, + "acc_stderr": 0.04351941398892446 + }, + "hellaswag": { + "acc": 0.4411471818362876, + "acc_stderr": 0.004955095096264714, + "acc_norm": 0.5774746066520613, + "acc_norm_stderr": 0.004929517011508216 + }, + "rte": { + "acc": 0.5234657039711191, + "acc_stderr": 0.030063300411902652 + }, + "winogrande": { + "acc": 0.5595895816890292, + "acc_stderr": 0.013952330311915603 + }, + "storycloze_2016": { + "acc": 0.6830571886691609, + "acc_stderr": 0.010759650951452121 + }, + "boolq": { + "acc": 0.5562691131498471, + "acc_stderr": 0.008689501105367413 + }, + "arc_easy": { + "acc": 0.5968013468013468, + "acc_stderr": 0.010065668576794803, + "acc_norm": 0.5913299663299664, + "acc_norm_stderr": 0.01008717449876288 + }, + "arc_challenge": { + "acc": 0.27474402730375425, + "acc_stderr": 0.013044617212771227, + "acc_norm": 0.3037542662116041, + "acc_norm_stderr": 0.01343890918477876 + }, + "sciq": { + "acc": 0.887, + "acc_stderr": 0.010016552866696846, + "acc_norm": 0.882, + "acc_norm_stderr": 0.01020686926438179 + }, + "piqa": { + "acc": 0.7295973884657236, + "acc_stderr": 0.010363167031620784, + "acc_norm": 0.7334058759521219, + "acc_norm_stderr": 0.010316749863541365 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/8b7178b13b/evaluation/rankeval/8b7178b13b_2.json b/8b7178b13b/evaluation/rankeval/8b7178b13b_2.json new file mode 100644 index 0000000000000000000000000000000000000000..34afc508d14f0aa5b4f51ff0ded9a129e1554170 --- /dev/null +++ b/8b7178b13b/evaluation/rankeval/8b7178b13b_2.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.343, + "acc_stderr": 0.015019206922356951 + }, + "anli_r2": { + "acc": 0.339, + "acc_stderr": 0.014976758771620349 + }, + "anli_r3": { + "acc": 0.33416666666666667, + "acc_stderr": 0.013622434813136774 + }, + "cb": { + "acc": 0.4107142857142857, + "acc_stderr": 0.0663363415035954, + "f1": 0.30617283950617286 + }, + "copa": { + "acc": 0.75, + "acc_stderr": 0.04351941398892446 + }, + "hellaswag": { + "acc": 0.4419438358892651, + "acc_stderr": 0.004956030970911519, + "acc_norm": 0.5717984465245967, + "acc_norm_stderr": 0.004938068627349502 + }, + "rte": { + "acc": 0.4404332129963899, + "acc_stderr": 0.029882123363118726 + }, + "winogrande": { + "acc": 0.5382794001578532, + "acc_stderr": 0.014011242594964115 + }, + "storycloze_2016": { + "acc": 0.6862640299305185, + "acc_stderr": 0.01073017911931762 + }, + "boolq": { + "acc": 0.5529051987767584, + "acc_stderr": 0.008695963064172717 + }, + "arc_easy": { + "acc": 0.6077441077441077, + "acc_stderr": 0.010018744689650043, + "acc_norm": 0.6026936026936027, + "acc_norm_stderr": 0.010041053078884286 + }, + "arc_challenge": { + "acc": 0.28924914675767915, + "acc_stderr": 0.013250012579393443, + "acc_norm": 0.310580204778157, + "acc_norm_stderr": 0.013522292098053059 + }, + "sciq": { + "acc": 0.914, + "acc_stderr": 0.008870325962594766, + "acc_norm": 0.908, + "acc_norm_stderr": 0.009144376393151108 + }, + "piqa": { + "acc": 0.7295973884657236, + "acc_stderr": 0.010363167031620784, + "acc_norm": 0.735038084874864, + "acc_norm_stderr": 0.010296557993316042 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/8b7178b13b/evaluation/rankeval/8b7178b13b_2_lm-eval_global_step84877_2023-05-15-10-06-37_2shots_backup.json b/8b7178b13b/evaluation/rankeval/8b7178b13b_2_lm-eval_global_step84877_2023-05-15-10-06-37_2shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..34afc508d14f0aa5b4f51ff0ded9a129e1554170 --- /dev/null +++ b/8b7178b13b/evaluation/rankeval/8b7178b13b_2_lm-eval_global_step84877_2023-05-15-10-06-37_2shots_backup.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.343, + "acc_stderr": 0.015019206922356951 + }, + "anli_r2": { + "acc": 0.339, + "acc_stderr": 0.014976758771620349 + }, + "anli_r3": { + "acc": 0.33416666666666667, + "acc_stderr": 0.013622434813136774 + }, + "cb": { + "acc": 0.4107142857142857, + "acc_stderr": 0.0663363415035954, + "f1": 0.30617283950617286 + }, + "copa": { + "acc": 0.75, + "acc_stderr": 0.04351941398892446 + }, + "hellaswag": { + "acc": 0.4419438358892651, + "acc_stderr": 0.004956030970911519, + "acc_norm": 0.5717984465245967, + "acc_norm_stderr": 0.004938068627349502 + }, + "rte": { + "acc": 0.4404332129963899, + "acc_stderr": 0.029882123363118726 + }, + "winogrande": { + "acc": 0.5382794001578532, + "acc_stderr": 0.014011242594964115 + }, + "storycloze_2016": { + "acc": 0.6862640299305185, + "acc_stderr": 0.01073017911931762 + }, + "boolq": { + "acc": 0.5529051987767584, + "acc_stderr": 0.008695963064172717 + }, + "arc_easy": { + "acc": 0.6077441077441077, + "acc_stderr": 0.010018744689650043, + "acc_norm": 0.6026936026936027, + "acc_norm_stderr": 0.010041053078884286 + }, + "arc_challenge": { + "acc": 0.28924914675767915, + "acc_stderr": 0.013250012579393443, + "acc_norm": 0.310580204778157, + "acc_norm_stderr": 0.013522292098053059 + }, + "sciq": { + "acc": 0.914, + "acc_stderr": 0.008870325962594766, + "acc_norm": 0.908, + "acc_norm_stderr": 0.009144376393151108 + }, + "piqa": { + "acc": 0.7295973884657236, + "acc_stderr": 0.010363167031620784, + "acc_norm": 0.735038084874864, + "acc_norm_stderr": 0.010296557993316042 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/8b7178b13b/evaluation/rankeval/8b7178b13b_3.json b/8b7178b13b/evaluation/rankeval/8b7178b13b_3.json new file mode 100644 index 0000000000000000000000000000000000000000..0129ce153d4301d7475f23bcd0f438c2b74ad82b --- /dev/null +++ b/8b7178b13b/evaluation/rankeval/8b7178b13b_3.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.344, + "acc_stderr": 0.015029633724408945 + }, + "anli_r2": { + "acc": 0.365, + "acc_stderr": 0.0152317762262649 + }, + "anli_r3": { + "acc": 0.3333333333333333, + "acc_stderr": 0.013613950010225612 + }, + "cb": { + "acc": 0.44642857142857145, + "acc_stderr": 0.06703189227942398, + "f1": 0.428030303030303 + }, + "copa": { + "acc": 0.74, + "acc_stderr": 0.04408440022768079 + }, + "hellaswag": { + "acc": 0.4431388169687313, + "acc_stderr": 0.004957410545559414, + "acc_norm": 0.58105954989046, + "acc_norm_stderr": 0.004923772581848488 + }, + "rte": { + "acc": 0.48736462093862815, + "acc_stderr": 0.030086851767188564 + }, + "winogrande": { + "acc": 0.5556432517758485, + "acc_stderr": 0.013965196769083555 + }, + "storycloze_2016": { + "acc": 0.6916087653661144, + "acc_stderr": 0.010679734445487801 + }, + "boolq": { + "acc": 0.5314984709480123, + "acc_stderr": 0.00872768484861531 + }, + "arc_easy": { + "acc": 0.6077441077441077, + "acc_stderr": 0.010018744689650043, + "acc_norm": 0.6022727272727273, + "acc_norm_stderr": 0.010042861602178056 + }, + "arc_challenge": { + "acc": 0.2858361774744027, + "acc_stderr": 0.013203196088537369, + "acc_norm": 0.3037542662116041, + "acc_norm_stderr": 0.01343890918477876 + }, + "sciq": { + "acc": 0.913, + "acc_stderr": 0.008916866630745923, + "acc_norm": 0.911, + "acc_norm_stderr": 0.009008893392651518 + }, + "piqa": { + "acc": 0.7323177366702938, + "acc_stderr": 0.010330111189370429, + "acc_norm": 0.735038084874864, + "acc_norm_stderr": 0.010296557993316044 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/8b7178b13b/evaluation/rankeval/8b7178b13b_3_lm-eval_global_step84877_2023-05-15-10-06-37_3shots_backup.json b/8b7178b13b/evaluation/rankeval/8b7178b13b_3_lm-eval_global_step84877_2023-05-15-10-06-37_3shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..0129ce153d4301d7475f23bcd0f438c2b74ad82b --- /dev/null +++ b/8b7178b13b/evaluation/rankeval/8b7178b13b_3_lm-eval_global_step84877_2023-05-15-10-06-37_3shots_backup.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.344, + "acc_stderr": 0.015029633724408945 + }, + "anli_r2": { + "acc": 0.365, + "acc_stderr": 0.0152317762262649 + }, + "anli_r3": { + "acc": 0.3333333333333333, + "acc_stderr": 0.013613950010225612 + }, + "cb": { + "acc": 0.44642857142857145, + "acc_stderr": 0.06703189227942398, + "f1": 0.428030303030303 + }, + "copa": { + "acc": 0.74, + "acc_stderr": 0.04408440022768079 + }, + "hellaswag": { + "acc": 0.4431388169687313, + "acc_stderr": 0.004957410545559414, + "acc_norm": 0.58105954989046, + "acc_norm_stderr": 0.004923772581848488 + }, + "rte": { + "acc": 0.48736462093862815, + "acc_stderr": 0.030086851767188564 + }, + "winogrande": { + "acc": 0.5556432517758485, + "acc_stderr": 0.013965196769083555 + }, + "storycloze_2016": { + "acc": 0.6916087653661144, + "acc_stderr": 0.010679734445487801 + }, + "boolq": { + "acc": 0.5314984709480123, + "acc_stderr": 0.00872768484861531 + }, + "arc_easy": { + "acc": 0.6077441077441077, + "acc_stderr": 0.010018744689650043, + "acc_norm": 0.6022727272727273, + "acc_norm_stderr": 0.010042861602178056 + }, + "arc_challenge": { + "acc": 0.2858361774744027, + "acc_stderr": 0.013203196088537369, + "acc_norm": 0.3037542662116041, + "acc_norm_stderr": 0.01343890918477876 + }, + "sciq": { + "acc": 0.913, + "acc_stderr": 0.008916866630745923, + "acc_norm": 0.911, + "acc_norm_stderr": 0.009008893392651518 + }, + "piqa": { + "acc": 0.7323177366702938, + "acc_stderr": 0.010330111189370429, + "acc_norm": 0.735038084874864, + "acc_norm_stderr": 0.010296557993316044 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/8b7178b13b/evaluation/rankeval/8b7178b13b_4.json b/8b7178b13b/evaluation/rankeval/8b7178b13b_4.json new file mode 100644 index 0000000000000000000000000000000000000000..c883ab101ddcbfa8f37bb65ab04cae9858e4b663 --- /dev/null +++ b/8b7178b13b/evaluation/rankeval/8b7178b13b_4.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.363, + "acc_stderr": 0.015213890444671283 + }, + "anli_r2": { + "acc": 0.362, + "acc_stderr": 0.0152048409129195 + }, + "anli_r3": { + "acc": 0.3516666666666667, + "acc_stderr": 0.013789711695404806 + }, + "cb": { + "acc": 0.39285714285714285, + "acc_stderr": 0.0658538889806635, + "f1": 0.3340305010893247 + }, + "copa": { + "acc": 0.74, + "acc_stderr": 0.04408440022768078 + }, + "hellaswag": { + "acc": 0.44064927305317664, + "acc_stderr": 0.004954503606471609, + "acc_norm": 0.5764787890858395, + "acc_norm_stderr": 0.004931065434173691 + }, + "rte": { + "acc": 0.44765342960288806, + "acc_stderr": 0.029931070362939526 + }, + "winogrande": { + "acc": 0.5501183898973955, + "acc_stderr": 0.013981711904049732 + }, + "storycloze_2016": { + "acc": 0.6932121859967931, + "acc_stderr": 0.010664275190473634 + }, + "boolq": { + "acc": 0.5162079510703363, + "acc_stderr": 0.008740459157499082 + }, + "arc_easy": { + "acc": 0.6203703703703703, + "acc_stderr": 0.009958037725468565, + "acc_norm": 0.6085858585858586, + "acc_norm_stderr": 0.010014917532627824 + }, + "arc_challenge": { + "acc": 0.27559726962457337, + "acc_stderr": 0.013057169655761838, + "acc_norm": 0.31313993174061433, + "acc_norm_stderr": 0.013552671543623501 + }, + "sciq": { + "acc": 0.91, + "acc_stderr": 0.009054390204866444, + "acc_norm": 0.914, + "acc_norm_stderr": 0.008870325962594766 + }, + "piqa": { + "acc": 0.7285092491838956, + "acc_stderr": 0.010376251176596135, + "acc_norm": 0.7393906420021763, + "acc_norm_stderr": 0.010241826155811632 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/8b7178b13b/evaluation/rankeval/8b7178b13b_4_lm-eval_global_step84877_2023-05-15-10-07-32_4shots_backup.json b/8b7178b13b/evaluation/rankeval/8b7178b13b_4_lm-eval_global_step84877_2023-05-15-10-07-32_4shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..c883ab101ddcbfa8f37bb65ab04cae9858e4b663 --- /dev/null +++ b/8b7178b13b/evaluation/rankeval/8b7178b13b_4_lm-eval_global_step84877_2023-05-15-10-07-32_4shots_backup.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.363, + "acc_stderr": 0.015213890444671283 + }, + "anli_r2": { + "acc": 0.362, + "acc_stderr": 0.0152048409129195 + }, + "anli_r3": { + "acc": 0.3516666666666667, + "acc_stderr": 0.013789711695404806 + }, + "cb": { + "acc": 0.39285714285714285, + "acc_stderr": 0.0658538889806635, + "f1": 0.3340305010893247 + }, + "copa": { + "acc": 0.74, + "acc_stderr": 0.04408440022768078 + }, + "hellaswag": { + "acc": 0.44064927305317664, + "acc_stderr": 0.004954503606471609, + "acc_norm": 0.5764787890858395, + "acc_norm_stderr": 0.004931065434173691 + }, + "rte": { + "acc": 0.44765342960288806, + "acc_stderr": 0.029931070362939526 + }, + "winogrande": { + "acc": 0.5501183898973955, + "acc_stderr": 0.013981711904049732 + }, + "storycloze_2016": { + "acc": 0.6932121859967931, + "acc_stderr": 0.010664275190473634 + }, + "boolq": { + "acc": 0.5162079510703363, + "acc_stderr": 0.008740459157499082 + }, + "arc_easy": { + "acc": 0.6203703703703703, + "acc_stderr": 0.009958037725468565, + "acc_norm": 0.6085858585858586, + "acc_norm_stderr": 0.010014917532627824 + }, + "arc_challenge": { + "acc": 0.27559726962457337, + "acc_stderr": 0.013057169655761838, + "acc_norm": 0.31313993174061433, + "acc_norm_stderr": 0.013552671543623501 + }, + "sciq": { + "acc": 0.91, + "acc_stderr": 0.009054390204866444, + "acc_norm": 0.914, + "acc_norm_stderr": 0.008870325962594766 + }, + "piqa": { + "acc": 0.7285092491838956, + "acc_stderr": 0.010376251176596135, + "acc_norm": 0.7393906420021763, + "acc_norm_stderr": 0.010241826155811632 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/8b7178b13b/evaluation/rankeval/8b7178b13b_5.json b/8b7178b13b/evaluation/rankeval/8b7178b13b_5.json new file mode 100644 index 0000000000000000000000000000000000000000..76f82522b12f592b48bb6adbe292a33f8ac74bb4 --- /dev/null +++ b/8b7178b13b/evaluation/rankeval/8b7178b13b_5.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.359, + "acc_stderr": 0.015177264224798601 + }, + "anli_r2": { + "acc": 0.335, + "acc_stderr": 0.014933117490932573 + }, + "anli_r3": { + "acc": 0.3258333333333333, + "acc_stderr": 0.013535422043417454 + }, + "cb": { + "acc": 0.42857142857142855, + "acc_stderr": 0.06672848092813058, + "f1": 0.38723751912112364 + }, + "copa": { + "acc": 0.78, + "acc_stderr": 0.04163331998932262 + }, + "hellaswag": { + "acc": 0.44343756223859787, + "acc_stderr": 0.0049577508971529426, + "acc_norm": 0.5806612228639714, + "acc_norm_stderr": 0.004924424018073683 + }, + "rte": { + "acc": 0.48014440433212996, + "acc_stderr": 0.0300727231673172 + }, + "winogrande": { + "acc": 0.5540647198105761, + "acc_stderr": 0.013970093482330697 + }, + "storycloze_2016": { + "acc": 0.6937466595403528, + "acc_stderr": 0.010659088460112754 + }, + "boolq": { + "acc": 0.519571865443425, + "acc_stderr": 0.008738352682962235 + }, + "arc_easy": { + "acc": 0.6094276094276094, + "acc_stderr": 0.010011059112064243, + "acc_norm": 0.6119528619528619, + "acc_norm_stderr": 0.009999295905750666 + }, + "arc_challenge": { + "acc": 0.2832764505119454, + "acc_stderr": 0.013167478735134575, + "acc_norm": 0.3165529010238908, + "acc_norm_stderr": 0.01359243151906808 + }, + "sciq": { + "acc": 0.913, + "acc_stderr": 0.008916866630745925, + "acc_norm": 0.917, + "acc_norm_stderr": 0.00872852720607479 + }, + "piqa": { + "acc": 0.7247007616974973, + "acc_stderr": 0.01042142927736953, + "acc_norm": 0.7393906420021763, + "acc_norm_stderr": 0.010241826155811632 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/8b7178b13b/evaluation/rankeval/8b7178b13b_5_lm-eval_global_step84877_2023-05-15-10-06-37_5shots_backup.json b/8b7178b13b/evaluation/rankeval/8b7178b13b_5_lm-eval_global_step84877_2023-05-15-10-06-37_5shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..76f82522b12f592b48bb6adbe292a33f8ac74bb4 --- /dev/null +++ b/8b7178b13b/evaluation/rankeval/8b7178b13b_5_lm-eval_global_step84877_2023-05-15-10-06-37_5shots_backup.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.359, + "acc_stderr": 0.015177264224798601 + }, + "anli_r2": { + "acc": 0.335, + "acc_stderr": 0.014933117490932573 + }, + "anli_r3": { + "acc": 0.3258333333333333, + "acc_stderr": 0.013535422043417454 + }, + "cb": { + "acc": 0.42857142857142855, + "acc_stderr": 0.06672848092813058, + "f1": 0.38723751912112364 + }, + "copa": { + "acc": 0.78, + "acc_stderr": 0.04163331998932262 + }, + "hellaswag": { + "acc": 0.44343756223859787, + "acc_stderr": 0.0049577508971529426, + "acc_norm": 0.5806612228639714, + "acc_norm_stderr": 0.004924424018073683 + }, + "rte": { + "acc": 0.48014440433212996, + "acc_stderr": 0.0300727231673172 + }, + "winogrande": { + "acc": 0.5540647198105761, + "acc_stderr": 0.013970093482330697 + }, + "storycloze_2016": { + "acc": 0.6937466595403528, + "acc_stderr": 0.010659088460112754 + }, + "boolq": { + "acc": 0.519571865443425, + "acc_stderr": 0.008738352682962235 + }, + "arc_easy": { + "acc": 0.6094276094276094, + "acc_stderr": 0.010011059112064243, + "acc_norm": 0.6119528619528619, + "acc_norm_stderr": 0.009999295905750666 + }, + "arc_challenge": { + "acc": 0.2832764505119454, + "acc_stderr": 0.013167478735134575, + "acc_norm": 0.3165529010238908, + "acc_norm_stderr": 0.01359243151906808 + }, + "sciq": { + "acc": 0.913, + "acc_stderr": 0.008916866630745925, + "acc_norm": 0.917, + "acc_norm_stderr": 0.00872852720607479 + }, + "piqa": { + "acc": 0.7247007616974973, + "acc_stderr": 0.01042142927736953, + "acc_norm": 0.7393906420021763, + "acc_norm_stderr": 0.010241826155811632 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5ac9554c8175d7c8597742d4fe391edb899c0127 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b4fac730c4a92198f0985ba1c7a733b40526cb677097f5560e491f5140f6b9f3 +size 460722583 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d330f584f8454e430f6b1899a2da07128783c9ad --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b0285fd797f0989b604e9d8b8924ae91bda653c860543a4d22787248f5973f28 +size 460722583 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_0_mp_rank_02_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_0_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e0d27a7e9e398b7efaedff1bfd0972234bfe54cf --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_0_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:29ca93e7e612322dc63e1ea508648f7c7e6735bbed0db2ed9aa0a5f7c5ff4cd6 +size 460722583 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_0_mp_rank_03_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_0_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dae17ac11d5f941ed0221646f516c33bf22d8156 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_0_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6403b6b7e650783ce2c00aba1dfe74cd98eb5d6dffb60954482e4d487380582e +size 460722583 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_0_mp_rank_04_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_0_mp_rank_04_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..188a6131d8838276f89bc813bc4b545a7e23f02f --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_0_mp_rank_04_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:24b7acd83a87c049067fbe0e68573c30db15edf925cdc7aea740d027116eb6b3 +size 415502807 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_0_mp_rank_05_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_0_mp_rank_05_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..20e807f8822cf6dc6b40e7f41a1aad61fa84966b --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_0_mp_rank_05_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:79d8a89b0c6a7620890c00cafb197dcb5d5be7be549dfcb6dea6dcc760484bc5 +size 415502807 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_0_mp_rank_06_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_0_mp_rank_06_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6ef994dde27f5b76990207461b5434da92bceda9 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_0_mp_rank_06_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:032b796a96b05b0157caed899cda0ccbeff8518438e0015e004dcc524f051399 +size 415502807 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_0_mp_rank_07_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_0_mp_rank_07_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f7a36f111a83df1ad26d2e01b46fbc400dfd34ff --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_0_mp_rank_07_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:50ce8668fb1564a8306e2cac01c71ca4f7ea60fbee5a44b7120df4b76352f763 +size 415502807 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_0_mp_rank_08_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_0_mp_rank_08_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..19f31cc35fac66d89c28873d3ed64ff2f1aaf650 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_0_mp_rank_08_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eff1df1691c0d3a3d1a755a9078aa76f433868aabaf36fdffee2ef8e9963f9f9 +size 415502807 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_0_mp_rank_09_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_0_mp_rank_09_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7f40b493c5de78261f31d15927f7274ca45d88b9 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_0_mp_rank_09_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:899ba36f401d211f5595b08f82e0b4344185e18cd60d8f48480bcb7d66b5823d +size 415502807 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_0_mp_rank_10_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_0_mp_rank_10_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cab3ab561cd734a3556b8cceb2f2e0966d729d84 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_0_mp_rank_10_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:17e6310443280ec43c0fd921558931c6e4d633e09015343ca8902139348dd352 +size 415502807 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_0_mp_rank_11_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_0_mp_rank_11_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c53bc92d4b4d6e0342d08d29415094bc6c7dec6f --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_0_mp_rank_11_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:892e920708619cbb4401cbad4782b8fb2b7d3a8ee70d2f9b2cd602fbd85c8f12 +size 415502807 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_0_mp_rank_12_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_0_mp_rank_12_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..72a48e9ac7bbcc3563ebc47981514c0d116f8417 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_0_mp_rank_12_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa9d6cefa89926cbc4aaf7cd97e1273ac232dbe113b18f686c850efecc9c6d3a +size 385183639 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_0_mp_rank_13_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_0_mp_rank_13_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..739efb74e866b641c15339ee02d5752e7260f475 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_0_mp_rank_13_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e526c7fa69105c3ef1a0be49ce94c4f72264e058151075c100b928254edc43dd +size 385183639 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_0_mp_rank_14_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_0_mp_rank_14_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ec78adaa452684d07f170aa33b29a69614dcf64f --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_0_mp_rank_14_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:63aa2961512eb5a78035ecea5470510d82f8f78bee505b30aea5abd78637aa4d +size 385183639 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_0_mp_rank_15_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_0_mp_rank_15_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ae98f975a11c508a8e9e3625d0a31d5cba91cfc4 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_0_mp_rank_15_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4c1c8ec83bc45c54a9b1576151f0644cd6208254f5cdd23181b16c930c43d4f +size 385183639 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..872195fc5ee5f8118a16156eb0642aaef2e4fa3f --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e59151e9918b806d59bcb4f285b8b8eb0db699b514b147b67e7d9ce86fea18b +size 460722658 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c0ad4b9d1aa2343d6006cfc545d6ec34bf5811c5 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c3fd6e809e0e1891c9f78e017511751ec72da9790589602bb9afff022e777b7 +size 460722658 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_10_mp_rank_02_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_10_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2e140c67a3517990d81fdbe643acbf4b64bee0cb --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_10_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc69275fc0695fd7b790f988191dc26f37b36f36ac02536d607d75dbfccd5ea7 +size 460722658 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_10_mp_rank_03_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_10_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7c91d0bd6c4a773e16c3407fd8fdd90083de2828 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_10_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:47a35277138036f76d5cb0496ba5bf85e4be75deeb6b2ff909ceaae23883a6ec +size 460722658 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_10_mp_rank_04_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_10_mp_rank_04_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..311a36c4883ad614cb44dd7509d21c098789448a --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_10_mp_rank_04_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd1cb51f94f853f73904171ff27907374ecfde8c182461c4eda9afbb0be83d4c +size 415502754 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_10_mp_rank_05_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_10_mp_rank_05_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..46493122091f8788089fd6dd18ae403aca105dec --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_10_mp_rank_05_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:26ffe802bdbc359dba2c11b808679d4e484817ec43341bc3060c1401dffc8650 +size 415502754 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_10_mp_rank_06_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_10_mp_rank_06_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a2dcbf04e8166d654865097f21775b8e2c19fc56 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_10_mp_rank_06_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f45cd87e17f6bee785d17e66a67d0a0653ae1b8f3fb5b2ae462e841801a1b7f2 +size 415502754 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_10_mp_rank_07_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_10_mp_rank_07_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..84803c6b51488d8eec42a4f3d21c3bf5e6d6a508 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_10_mp_rank_07_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:527649d74297b46471f7bea4aa5244b8dec5913b7742294f79332fb26dc29bcb +size 415502754 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_10_mp_rank_08_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_10_mp_rank_08_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..91236756c8105b1b0ff1809f28d07b8ad5c2fd6d --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_10_mp_rank_08_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8fb9e7c4abd384005b49d1afac3e315959aa91f8c49872a2c3ac0f7a515fe235 +size 415502754 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_10_mp_rank_09_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_10_mp_rank_09_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..92ea277d933c7dd9a83f02935aa3951dfa227acc --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_10_mp_rank_09_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9fb96ef88af54de224e88943d889c972847968d4e42441dcb08409ce017b7f16 +size 415502754 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_10_mp_rank_10_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_10_mp_rank_10_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..09553179c7f55603c1514700f767891cbb41d4a8 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_10_mp_rank_10_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8df15deb596217a955787342dc2195ec603aa720ed29ded89081fe7fb62610ce +size 415502754 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_10_mp_rank_11_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_10_mp_rank_11_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8092b60527439e0a855f2a6e24867d25b43497f9 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_10_mp_rank_11_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76aa92be978d013d0b9f2d616a8e2f906828b98d357c4be30e8ace4c2a144e95 +size 415502754 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_10_mp_rank_12_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_10_mp_rank_12_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4b2e3043ab028912201301adcb6459258a63933b --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_10_mp_rank_12_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:52ee2ba45b24f4cbe24df7d84fdf54a19a29b09c6f29cfc265e218bf29cb14ef +size 385183842 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_10_mp_rank_13_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_10_mp_rank_13_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e1d99b3f95aa44f092a7f9798699e70f99777512 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_10_mp_rank_13_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c5cba912370e91738ec86615bb05d127f13883da1fdc74e765aca7d21467b109 +size 385183842 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_10_mp_rank_14_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_10_mp_rank_14_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..865ce382737af45dfe430db95f6d84ab89bd46a9 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_10_mp_rank_14_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:646cc5c66d6a635710bd12f62694bbbde80c29555bfac98a24afbefffd2cd92c +size 385183842 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_10_mp_rank_15_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_10_mp_rank_15_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dd21981df44d9822534a5e9140a5f9f83c2ec0b7 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_10_mp_rank_15_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c18a8688a620e472ad4120510acc8e02c0968bb52397601a4db19e0d4da3e2a5 +size 385183842 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a703a5d5a6d297e551c6573b028f59a22cace757 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ffeb2c4c83b612eff421a62e4f3ab3bd9c9bcaa6a84d8640beacb25ab90bfe5 +size 460722786 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9676ba9ec2f18e81e7b7917d40a6e5531519657e --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31af47b9c364832f80b041b6b16758eb89a48e6d4350721a385345682cf57dc5 +size 460722786 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_11_mp_rank_02_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_11_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ab65f2c485cb0e9c4d5b18303cfdb243f794e1f3 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_11_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a7a808a22fe9f15703ee135e5dce22fafd63b5ea7b18df99dbf8722df84d810e +size 460722786 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_11_mp_rank_03_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_11_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7a7ac25f791002dc981a5ff1b23e03652d0739d2 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_11_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a280fa4dd384528457ca4ec061d75544b48fb54e1719e3fd2fefbe51c3bfc563 +size 460722786 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_11_mp_rank_04_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_11_mp_rank_04_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7b8836f76f2b75343a0aa33aa456c2becd3d8cdd --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_11_mp_rank_04_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a94cc3e8699614fced624d0d56ec478a7d8ee74cdae80dac342314c5ff128de +size 415502818 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_11_mp_rank_05_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_11_mp_rank_05_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8613309513c33732ec4170cde9921a4630adfe20 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_11_mp_rank_05_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9dae0e9a1af4c43f8b91f3254aa05169de53d2fb99eb01e4a23be200cf3d77cc +size 415502818 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_11_mp_rank_06_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_11_mp_rank_06_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..519a94f31540c7b32d7b6973d14b75b4d0fa92d6 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_11_mp_rank_06_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4743229fa5b441cc809cae74fe032154bde12b1a22985fbac794be718d9b7c87 +size 415502818 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_11_mp_rank_07_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_11_mp_rank_07_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..07cc23d4a75371e2a6980b570e535a6996e5b2bc --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_11_mp_rank_07_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec7965baddf6df2a2bf3af451ec73cd5705cf672419ccfd94eeaf62a07a8abe2 +size 415502818 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_11_mp_rank_08_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_11_mp_rank_08_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ae3f2bd1a0b58a86168cb0bca375fc230471b5f5 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_11_mp_rank_08_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af75dd7c59e17a1eaa9bdb8186b1dcf5d5467a038ec3590cc32276e145279be4 +size 415502818 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_11_mp_rank_09_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_11_mp_rank_09_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..25e3ed65dee33a21e92fddd1f77476034599453b --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_11_mp_rank_09_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b545fe0f5e46837c273c06d7e1b3c64a48a2fdd10cc81e4b730f63922e9e1fd3 +size 415502818 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_11_mp_rank_10_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_11_mp_rank_10_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b1388f4b5baddc37421f0da16c664642bffd4a46 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_11_mp_rank_10_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de1181685517d38758dc972e5a38a3583763fab4b1d444a88c5edaaf857c34c4 +size 415502818 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_11_mp_rank_11_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_11_mp_rank_11_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ef5f1db0f8fa6bf4a94f073f2d740124c76a8bbf --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_11_mp_rank_11_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e0fe7e671efc9008c8fa9ed2a49247067406f2214e940fd4d092229d072a2b3a +size 415502818 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_11_mp_rank_12_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_11_mp_rank_12_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8fc11da0276768935e298c5655be93a785ef4578 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_11_mp_rank_12_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4799d565d4fe41a1f75b021ff7ddd59fae3d20a34fed18f44846eab159687b3e +size 385183650 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_11_mp_rank_13_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_11_mp_rank_13_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9559b4fc6e271d37072559d46a805e0a9804f897 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_11_mp_rank_13_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:349083822e3f9d6db9ce662cf0423501ecc96c4a9fd144f36e9c70baf705aff3 +size 385183650 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_11_mp_rank_14_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_11_mp_rank_14_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4a1aa22baf4503004a937608c6928ac447f6b1ca --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_11_mp_rank_14_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b10b720cddf1960400d95b979d02e36ea6ca64a4e92af4e4f4ecd97d09278ea7 +size 385183650 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_11_mp_rank_15_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_11_mp_rank_15_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..46edf4dfcc556d98602c8f0c675d1cdc46188fed --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_11_mp_rank_15_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e74eaa2b30d8f313a6950d8217d83c55b56578e14c067bf7f3c47e37c63f93c9 +size 385183650 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0ed8fb8d296b69be21626000b7d16c9f06edce63 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:beb89be6fcc0df13ac65e97b532e8bc507dd5bcc06ca44ab26601f7c6310086c +size 460722786 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b18b28e2ce54f5c6d2646522cd98a36751adc41d --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d0168a1b721b2c4869b66e241a97583581155f77e7dc3966b91f519583c18563 +size 460722786 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_12_mp_rank_02_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_12_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..453e188b6fdb5718a0cef1f3b4fc9d92ca085851 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_12_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9159d0bf7c868f56a501d9a94e6ed5867e642191a6967fcbe322029bffe5027 +size 460722786 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_12_mp_rank_03_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_12_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cd776f36d02c4eb65f61beaebc4afb4a73621907 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_12_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ec99b7cb79a4a372810d3d193b72b9348d57b1bd9ace4173fb5c1f9b33b7221 +size 460722786 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_12_mp_rank_04_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_12_mp_rank_04_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..09892a9c2601692d98d4b651502d3574f543d976 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_12_mp_rank_04_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e95daba44db70304498a2c19880eec5dc611522e2b00b1577d3480ce1775b2c9 +size 415502882 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_12_mp_rank_05_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_12_mp_rank_05_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8740ad2fb6d47a1e9496af3dc0f537c27141ad5e --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_12_mp_rank_05_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c9b0460a7ad5b7334b4d27eaf55b541023bf50b6c01ec8422585ee22cfbb6bc2 +size 415502882 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_12_mp_rank_06_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_12_mp_rank_06_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e70c44a50b294556cf683b5b827199ef20d723dd --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_12_mp_rank_06_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b1c962e5fd0e7d0f086added28cce0c7a308ffbdb527cf1d97e98307df279f8 +size 415502882 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_12_mp_rank_07_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_12_mp_rank_07_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..69c419efce2c7a2d599092077c341393a95d069b --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_12_mp_rank_07_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bbd76592c480b7f99eb3a85b016cc9fcdaa1a380d040e053541a39ab05f48a7e +size 415502882 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_12_mp_rank_08_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_12_mp_rank_08_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4b62fbf4faf1122774b5b50c0ae990f6ed73fa26 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_12_mp_rank_08_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c31532ad5bc44da053fe09fdef66e928b762a6cec2bc4b83c8516cbbb981f2b4 +size 415502882 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_12_mp_rank_09_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_12_mp_rank_09_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5e10ef7e5a814330e954188618c7eabf69e7269e --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_12_mp_rank_09_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:513bfaa0c42bd6b28f444b180916a6b68495235498f3d2369e82b972243df460 +size 415502882 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_12_mp_rank_10_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_12_mp_rank_10_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9db9cc37b94ce7acec54d66f1e7ed55efb4878f1 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_12_mp_rank_10_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:663f8352404327fa4f0366e2de46f955609ce17e100273ffd76fe13c0f072045 +size 415502882 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_12_mp_rank_11_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_12_mp_rank_11_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..15c4e369932527967e45c28e3520a8d46f867bbf --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_12_mp_rank_11_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:440364093a5af7003217ab73ccda360c67156319e0ce6bc9b047ba08d71036c3 +size 415502882 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_12_mp_rank_12_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_12_mp_rank_12_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..289acae8b062a3415ee3476c4c86b9e810c5a9d1 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_12_mp_rank_12_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d848dfb69e54a390e4bde6fa70784f749d0739d4a3167a2b609745345c848bcc +size 385183778 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_12_mp_rank_13_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_12_mp_rank_13_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4509947fea4b44ddff427970b7089a1469c8f24f --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_12_mp_rank_13_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c191215ca10ba4e8bb6b23be1bf6bf3e8bed2674133f2e232bee00e7b643f940 +size 385183778 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_12_mp_rank_14_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_12_mp_rank_14_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8acba5b658f90112110b8ea91b03391feca32c73 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_12_mp_rank_14_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a61f252d0436de8b98ee2ad1a64c75610097fcca4a822971ab4356e4eb1c6650 +size 385183778 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_12_mp_rank_15_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_12_mp_rank_15_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..455986c8abdce899d3189175a7a2c2a690e8de6a --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_12_mp_rank_15_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c5d3ea096283fd8dbb55b2939734f84b60b9fd188bc00c0cc2b51666ecbe965 +size 385183778 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..51cdd7894c06a4937b488fee9fe3db8d33f5667a --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8440c551da3208dd5e6700078a805cad0c5b43fecb2e692fcc2fff012e3080dd +size 460722850 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6626ae876e85fe0677053c0d38cc26aaecbf813d --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97bdad77f02188bfea373e2cafe8aa2a7296fcb793351cef57b9c2bf74f1f17d +size 460722850 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_13_mp_rank_02_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_13_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..233e66fcb1ee3cbce984118e7acf700c35ec0979 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_13_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c75898c65f5a41e7b7109df90ff38d640c63e498b65755d5452ddaf06daa5e53 +size 460722850 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_13_mp_rank_03_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_13_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..475a80dcfabafcbddd626e6b885f9e6078f50cc1 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_13_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:79744e8b234b9b7575732ccf58e1b9d7479be373d47f07964dad7deaced55cef +size 460722850 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_13_mp_rank_04_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_13_mp_rank_04_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..57868b146cf4df166990c173229ffdadecab4650 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_13_mp_rank_04_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f16652bb1e313dd00b0b3dc81083844efb1e75d7a4b49478d8803f8631995d83 +size 415502882 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_13_mp_rank_05_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_13_mp_rank_05_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d1a1da8182ea70fb29aa8975ca5f6050e0e60bd1 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_13_mp_rank_05_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:268a2838a90f47bbd82f144557abd91377f8b93c95c9ed4de5b5a7ec966e94d2 +size 415502882 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_13_mp_rank_06_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_13_mp_rank_06_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..87b95aa82881d40b894aa8c6bfa192204869e210 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_13_mp_rank_06_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4866c20cb1ce003b421b54c73ee50eb27077412ac511e4e6ccbc8f8459d0b9a4 +size 415502882 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_13_mp_rank_07_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_13_mp_rank_07_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..836f2ba24fae6cba1689b46fbdce9e3eb520a0cc --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_13_mp_rank_07_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a23bd7ba8c07f4c0f0f96ca5ed3e634831702129759eea88fe032d10c039ad8 +size 415502882 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_13_mp_rank_08_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_13_mp_rank_08_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c54f6558770a53ba9a3e1c2d55adcc0b7e9a3bbf --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_13_mp_rank_08_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:743684a81e88a4e70da69f5528d11965a52e0a0f28584b390ee3bba9eb251858 +size 415502882 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_13_mp_rank_09_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_13_mp_rank_09_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4f87e04f993d8511301d8e83c96f7ed2246c15ef --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_13_mp_rank_09_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d7b619f53525bfa4a132c448308af586091aafbcb090ba1abb2faf4dafd68cd0 +size 415502882 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_13_mp_rank_10_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_13_mp_rank_10_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cadc2770be6ac01c15aa2ae8cb70a8ab30fe8cd4 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_13_mp_rank_10_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:78f5fb15127a351782ff2d9dffc5be250e2917c8868d973af1a03a42a6cc686e +size 415502882 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_13_mp_rank_11_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_13_mp_rank_11_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..95268051e376ed72d72d941a9704500a7944d8e8 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_13_mp_rank_11_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:498f14bcfcd28ab7f558a2ab09d341fcb80492ab630bdd2f2a01ecf750424208 +size 415502882 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_13_mp_rank_12_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_13_mp_rank_12_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8a68a42778e1c4a25b81a294353a8ba7424e1c34 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_13_mp_rank_12_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d40d151bc104a3e377bb3c82211e904fe82ec0976849fa57241657fd1d1694fa +size 385183842 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_13_mp_rank_13_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_13_mp_rank_13_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a1cfd8af229ec414c28b578da1d56b2d1d8319ce --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_13_mp_rank_13_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:21270ee207367bcc447cb9e89ba7c0e73c5c9b1923b0b744224648df1fac0801 +size 385183842 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_13_mp_rank_14_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_13_mp_rank_14_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..207d8d18e410f286eec254725693a657b13751e2 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_13_mp_rank_14_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a828b089cdb8b19a496e43ee08d0eb410c73b44d31fc8379344521ee75af762 +size 385183842 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_13_mp_rank_15_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_13_mp_rank_15_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..194788a1267f6f85a98e34e7bbbe341215b01de8 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_13_mp_rank_15_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a3b0944b6046431e3595fc9874389ce8ad9b512f68fc7c81475d5c6f90446601 +size 385183842 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c7dbc318f67e3e078376836e4c9b1f7e00931050 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d5ab08189731221a82f4a407964418243136adc439dcb6802bf7cf2acdd1315 +size 460722658 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3a9ba77ae217219ac022a33682dd2e40359c7ba6 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e9d1b0acc22a2db3f0cbd4a38d4e2dafd07bbcdfc5facba01e443776853624f6 +size 460722658 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_14_mp_rank_02_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_14_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..279f6aaa029fc01868aee519cb0d04c32a4a0715 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_14_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cae64b2c053518969ba8a5272bc1afbd7505903fca5555e7ce58c7e901fa0d62 +size 460722658 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_14_mp_rank_03_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_14_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..622c765016b5abfc89c570a0a5222d02b90e05c8 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_14_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b16fbc3a4e5fc9cc172bdf9b9b2edd07c9aaaf6fa96ec9a7ac3fc21f3e8527c +size 460722658 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_14_mp_rank_04_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_14_mp_rank_04_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..43f72764c4aa25a026c7ab5556792e721cc6fae0 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_14_mp_rank_04_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6030c5a1a40de22f8050c8cf472e1de97dcae1eefff2358e42dc34ab0b36a710 +size 415502754 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_14_mp_rank_05_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_14_mp_rank_05_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d80e4a35e9ec1f0590d0924324b881aa1fab6cbe --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_14_mp_rank_05_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea8dce27ac31a2a900d5f5bbb1680022abc1d01ccab20657dccc06151957d827 +size 415502754 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_14_mp_rank_06_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_14_mp_rank_06_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ad77037191c0536c6167d69770ee6db569c58129 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_14_mp_rank_06_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97fe7edd480e97254f6722fd6a75c3a0fbb361ba476c76fb6253bf714c3c01bd +size 415502754 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_14_mp_rank_07_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_14_mp_rank_07_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6a5369288df6741c381ce4e11640028a7aa32a56 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_14_mp_rank_07_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4f2af42d498129c7c46b45a9e0377ce942783cb19b4c5546638defdcca62401 +size 415502754 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_14_mp_rank_08_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_14_mp_rank_08_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..77bf7935c521cad12841a80c276059b88dcae390 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_14_mp_rank_08_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb0b4c2654d3118c8e911261667e98064e8468545aaaf6ad31d69bb80bbec07d +size 415502754 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_14_mp_rank_09_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_14_mp_rank_09_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5e9994453c0107aef68e6578d520d66551ad380a --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_14_mp_rank_09_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ca8b9bda62ab5243d2f8391588d0eda0b2582b0ad2db78626583dfee62e7a40 +size 415502754 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_14_mp_rank_10_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_14_mp_rank_10_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..db8935cc447cb724991cedc8d9f5e3ad4932c537 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_14_mp_rank_10_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2802aa2951ec313303c2114e0cee04ce19f91740c825917fef2a66311e80f60 +size 415502754 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_14_mp_rank_11_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_14_mp_rank_11_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a292b72751c3f143a84f8c13d3cf0c33c9df8283 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_14_mp_rank_11_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c379a9cadaa8bf4228b2bad1c7011fcdfcc979d1941cc00dc217d7cffd80501 +size 415502754 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_14_mp_rank_12_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_14_mp_rank_12_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6ab9b5a83c588e2b103b0d659a708043ba3245e7 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_14_mp_rank_12_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf42e9e9f79fb1432e9a9a8664321a654fc781c9b59468cae258f6893dd7422a +size 385183714 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_14_mp_rank_13_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_14_mp_rank_13_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..da53fade35017270bc4dd1383d39b5a8f537e07a --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_14_mp_rank_13_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1be82105663623d1e0a443eec5bf3e35770b39686f9e95af383917cff3b4518a +size 385183714 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_14_mp_rank_14_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_14_mp_rank_14_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..75886fdce551714a54d57699374e5e81d598d5d7 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_14_mp_rank_14_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b27ec8d941c3a4c5bca54aea7f7691e501c4579c244750affef173ffa66cf7f0 +size 385183714 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_14_mp_rank_15_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_14_mp_rank_15_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5764aed201acee5565c597455f139f9735511c95 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_14_mp_rank_15_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:66262fcf85f65f91952b98518716d2ecfc8fb351a0b4f5474e9741b3a251c888 +size 385183714 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bc9a1d521ad574e9565bef6f14a830f9d4889bcf --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:14ede5cc16bf6ec7acde5a70f9c4f2639c83c80603905a4e121667344dc40554 +size 460722658 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..12ad1a4ef25e5f71e4b897dd25b140c38f0db7b9 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:32b15db0b57baabe54e9472256c8764384cdecbc7c97e936693f7f624c009595 +size 460722658 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_15_mp_rank_02_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_15_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1305dee889eb1615519ff3e3e24f53aa80b1ead1 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_15_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e82875d9d1d0addf635e4c5791d0074ed40306dd9f8b29d6d8c13c93d3ebbf72 +size 460722658 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_15_mp_rank_03_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_15_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0040070562d8707744aa043c6c2347ae7a30ea5f --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_15_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:16cd39badf4fb4db6b40d9f0ca6ef6bd0ba8d9594d57ba4aec6f125c36ae2803 +size 460722658 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_15_mp_rank_04_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_15_mp_rank_04_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e79a2800c761fef2fad6244b2740f5455d46508c --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_15_mp_rank_04_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:374608bdace058b68d3926d41b00115f47fc30e96b4106f54caa00a44055640b +size 415502818 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_15_mp_rank_05_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_15_mp_rank_05_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2c67e5742ef9d070417b600445ecc874faa68027 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_15_mp_rank_05_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:05d66a715bcf03016be7b32b7aca0e06ef938d64eb34394a6e48934c8b9494be +size 415502818 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_15_mp_rank_06_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_15_mp_rank_06_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..68aca4436ccebcc2e9a4385f6f18c4609986215a --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_15_mp_rank_06_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc51c46a9e4205b62d1bb0b49f3ca51d3a668bee3fc89df4873ffaa801f45d59 +size 415502818 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_15_mp_rank_07_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_15_mp_rank_07_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d779abd52bd9451208b52fcb43a3eda58cc8ea0d --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_15_mp_rank_07_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0215ed7216405fbb1be7b323f7478573f18fde13ff3004c4f75ac6669ac1104a +size 415502818 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_15_mp_rank_08_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_15_mp_rank_08_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..445613afb23e1089575e661755b6b2ece67093e7 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_15_mp_rank_08_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7cdf2d75f4bfd2a60f0e1ed6146af7396398e75d46968e9dee2333444f1d3c39 +size 415502818 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_15_mp_rank_09_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_15_mp_rank_09_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7b052ab47c981695cba87c5be51de41d41cf2f5b --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_15_mp_rank_09_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:44b4820b6eb9eb6253c9b2c264a9d2e45b4c3463a448602116d59b1e185d6ab9 +size 415502818 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_15_mp_rank_10_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_15_mp_rank_10_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..70e094a23528db7166fe3f5eb45263e99d15fc83 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_15_mp_rank_10_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:522f5d7ef675711dea7d73c874cf5b0433b66877661ab9559a94c05661778b9d +size 415502818 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_15_mp_rank_11_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_15_mp_rank_11_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f34106787ff50132afbebe03d32f387ac4b09dd7 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_15_mp_rank_11_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:394ec962b0f1242d49058ef3757e975bbca3731bd81117c02b76d0c17e28e345 +size 415502818 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_15_mp_rank_12_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_15_mp_rank_12_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0e53cbeb72129d2f4dd13064877edf99f5032d1a --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_15_mp_rank_12_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b7f94d5f022aece128203b3c31d7cf113b969ccd71c4c4ddd9caccd1e870b6c7 +size 385183586 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_15_mp_rank_13_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_15_mp_rank_13_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..408b5ce4dacf98adea468889f40bc1a423af5645 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_15_mp_rank_13_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e1d01df71d6c6ac1c51f519a3bc92b68ab68071c17d2106cf689df65933543d +size 385183586 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_15_mp_rank_14_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_15_mp_rank_14_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c254e4a6e718b00a1917a82210408cc0f22deb08 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_15_mp_rank_14_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b34ce654d79d4fa9cd7017efce31cc3e1a9bb132d6a075215058f0b05774f2d9 +size 385183586 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_15_mp_rank_15_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_15_mp_rank_15_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e28c4b3040d831cec5191b7441c0e60d5a47bd2 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_15_mp_rank_15_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ec1dcdb2631afd846e82e39c2d12eea837271fdfad86dd1e57066eac95b55df +size 385183586 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..732c3be68902b48f88e010409f5a2238b8391908 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:59e9bfb2e454905be7d5f5df38c9402f761859a1d9aa5dfe00d62d55452438bd +size 460722647 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c377a8af18bf2960e5a8a5aca2b6db9f55743fa0 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:17db71d0f7da7cb3eaca67421f45bf1cc6ee9eb4d1e3f2fc113eee3c84cfee93 +size 460722647 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_1_mp_rank_02_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_1_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e821aa91f466e14aadeafb530f5abb1bd5ce3e3a --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_1_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06402fd89ae5a70e619b89e4aeb166acae09827e210394ec9d8f83d57169997f +size 460722647 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_1_mp_rank_03_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_1_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..725868e65b0d618b3098667ea3046bc3d2424960 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_1_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51bb5485d3f5c3dde4f78f219f97718fe7953f9f80615f2548cb1bfe05ea71c8 +size 460722647 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_1_mp_rank_04_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_1_mp_rank_04_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..97ae40a0885ada1595357e03e697c2b0fcb400b3 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_1_mp_rank_04_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73a2d9970e548e1c5e8890648ebc8cd860e1513df815d0a429a29a3894950608 +size 415502807 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_1_mp_rank_05_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_1_mp_rank_05_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7f14509bb91faefb0ec6aaa30918755595177070 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_1_mp_rank_05_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dfaa301714fcc7502b2edd19546d484655053471a82e2ba016b57289c44fc843 +size 415502807 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_1_mp_rank_06_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_1_mp_rank_06_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7b15cfaf6cdf25cbc03e58b23671d55e8db8543e --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_1_mp_rank_06_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:26d4ddf6286d99209556e733b852f6711aca039b5a65f20b75c92857c35fd5aa +size 415502807 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_1_mp_rank_07_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_1_mp_rank_07_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..91dea8f600ec352903edb862192ea5a7ec770b92 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_1_mp_rank_07_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9484cbc8001b45207b65bad971c0a81f6a7d52a337399e2ce0c6531d7ed15ede +size 415502807 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_1_mp_rank_08_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_1_mp_rank_08_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..751cc4637b9bbe122a9518ed5cd820a88dc94309 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_1_mp_rank_08_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5618da70dc4c09147e8b46cc88f259d975663263baf2514c77a605ccbfd54cd0 +size 415502807 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_1_mp_rank_09_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_1_mp_rank_09_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ce91e9c9997804a2d19b8c1f0000a52031b296a4 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_1_mp_rank_09_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cae2098fcbe227c80e355bafa2f051000b5fa7ad8361293497e9bc56868f4f96 +size 415502807 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_1_mp_rank_10_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_1_mp_rank_10_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ba703c3924c0dece569f520a7be73953b2ea1059 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_1_mp_rank_10_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee977dfbeb17625528f11777a0f30cdf536f29cb08933b25e80e0a8a453b6d24 +size 415502807 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_1_mp_rank_11_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_1_mp_rank_11_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..697414674059883ef1764f5f3a013404b4032c6e --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_1_mp_rank_11_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1931501878584c4379f3b7cb73a71607562314bd5d8808350bb11d55a27c6a47 +size 415502807 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_1_mp_rank_12_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_1_mp_rank_12_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..44b2e01bba9118528c0689f25e9e41d859e90abb --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_1_mp_rank_12_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:52d3075612885fb1a002ee4dac2ef155f1699ccfb708ca0872f0002dd60b2636 +size 385183639 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_1_mp_rank_13_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_1_mp_rank_13_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c105ad63d3981285d1cd89704c7ffad022b1d848 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_1_mp_rank_13_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f9708a620c8acf3fffef04a0ee53a46a4c10b4d6ab762e524c3505af2235fd6 +size 385183639 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_1_mp_rank_14_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_1_mp_rank_14_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6ec53fd779c18b0069d43090d503f2e51be462c1 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_1_mp_rank_14_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb864b5963df358ff71a96f2caf0924cc426e77a0ce981a8f6e0ba13d1f57e36 +size 385183639 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_1_mp_rank_15_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_1_mp_rank_15_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..efca1f8db0f65b2a13ca78aef4a097e80ea10800 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_1_mp_rank_15_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1477869237ae0242fb65ba2209368765a1acbf379356134aae15285bdea68b97 +size 385183639 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..eb85b0e5beb70fa590cdd55eeee0427be5d4a57c --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f90bb2b66f3ceaf5618a0ca798a45c83f53f21da0aa36f9fa140cf319030268a +size 460722839 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9a3e669dfc3be3203b126475ff1a8fb753f2234e --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:639656a981457e4f5f02f260820e21b967e8bd9dd431de7a7967d55bb17b2ec4 +size 460722839 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_2_mp_rank_02_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_2_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..37ec52ce4a40467b29fbe45f150eb8fc91b65522 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_2_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:420991bd8a2b46ec4ea5069a7e493043347a166a1d6a624dc92cb864c12a498a +size 460722839 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_2_mp_rank_03_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_2_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..33700567e5a8090fbae6c8f0979ebf1af658da78 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_2_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:65aaa348e32f81716c1be93ddff9374d21de3901caef2a5c357fcebf4ae8661b +size 460722839 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_2_mp_rank_04_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_2_mp_rank_04_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c76b460bd9f02b8aa44c4033566436dd95e8efe8 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_2_mp_rank_04_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:885b77ac273699991d4cfd978f9c9e852a5b9a154f6760676300851086661751 +size 415502807 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_2_mp_rank_05_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_2_mp_rank_05_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3e3c341d4c7a6d222bdb98528ef3e691f7ec4423 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_2_mp_rank_05_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:290333d96692b08995522801effc0ef39c276c166af0b4b5bf2aa4caea1f2ff1 +size 415502807 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_2_mp_rank_06_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_2_mp_rank_06_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..52a15b073a5e576eb9fe0bd38044d5dc828c6cb8 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_2_mp_rank_06_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef77c579bc60e6542d0f0befb5c7867c87546d90ee8a56096498eebdf0eed8ea +size 415502807 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_2_mp_rank_07_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_2_mp_rank_07_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ee7db79a90bc32fb6a56c29d51404dc26fb0c0b2 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_2_mp_rank_07_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b14cae86fae1ccb518ad848315e4a9201b8fc3186e1e510a7565fec4759992d9 +size 415502807 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_2_mp_rank_08_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_2_mp_rank_08_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dfb9fc22ccf1e9155da1076ca29779341272b605 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_2_mp_rank_08_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b1d08cc4d4557035bb42924a183a223bc1183f32dd4c70d2f6449ac5baa038e +size 415502807 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_2_mp_rank_09_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_2_mp_rank_09_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..35375b695ac3a78ecf33b94a6e26ad36ce42460a --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_2_mp_rank_09_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6a24a9f3d71f59b54fb94c4cde01a4a0b589b72dd2a4de58cc08ad45c053f1af +size 415502807 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_2_mp_rank_10_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_2_mp_rank_10_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3d0f1661eb5506aadbabeeec2f53ff7d3167410a --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_2_mp_rank_10_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b127e2582c30b3b3e208715b63863b81bfcf2307c99b7082b33995073b3b85c3 +size 415502807 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_2_mp_rank_11_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_2_mp_rank_11_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f7c08d6edf227fb33e507aabcba818dabec79c3e --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_2_mp_rank_11_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2685220266bbef21d662d0ef9b0717bc5847dd3cd4efb2c9b1afd5b1700cc4b2 +size 415502807 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_2_mp_rank_12_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_2_mp_rank_12_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..266c9d4203c194a6b4f3e2f632ca20ff1cdc78ec --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_2_mp_rank_12_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2803b433be4c0703506f45aecbd47cb17eb53c927f9b0faa8d0cea136ac7b696 +size 385183639 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_2_mp_rank_13_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_2_mp_rank_13_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..143a5cfef5127b107e9d4b89ec5fdffd98e296b9 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_2_mp_rank_13_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9377c541d6675832cf4591be741df939c9c52397da31be8a1a446fbe5104b7ab +size 385183639 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_2_mp_rank_14_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_2_mp_rank_14_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..051bf791ea5f69705c49974562d572a656a941b8 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_2_mp_rank_14_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af04ba0ce573590d44b36376dcbbb09aa712bf817a28f31898f3276b71b3216e +size 385183639 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_2_mp_rank_15_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_2_mp_rank_15_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..589a590b6ae0c3a79ac44a33f4651b8790c028d5 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_2_mp_rank_15_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:973977261ca88c1bc9e243341b379b72fd8eb05fc4a118a14d94e2b07aa71e7e +size 385183639 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fad793026497862aaebb50b9a17a82a592c97a02 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:616cab68212b384c75de9369bd6a3d62e9fabe17317c6797b4a6474fb212e4a8 +size 460722839 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5d5c3e371fd38de5a2b8155a5073f9f0c2d58bfd --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:40c32eff448b919a520ebd470055bb47221e92473ac4a0bf822e6fb75aa6f7ec +size 460722839 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_3_mp_rank_02_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_3_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..33b82ca325a503fb83aa2b6f052388cca7baae43 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_3_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae2949783ca37d4f380279b47487f8bff6bf89af694efe68bf72790e767343ff +size 460722839 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_3_mp_rank_03_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_3_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d18d853173bab16837c3801ac97c61b85c36f385 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_3_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d7c6e8e26018ff6aa3f3c2bc8e6d63165c2aced6cab82c8dea722902d24d6a1 +size 460722839 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_3_mp_rank_04_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_3_mp_rank_04_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fb7366c2ba820b73ef19f6fe78751a5cee1dc967 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_3_mp_rank_04_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea987c073d9148be9674f21c6903699c1fa4d24b51319c93f8a33e7bb6eb2c06 +size 415502871 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_3_mp_rank_05_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_3_mp_rank_05_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ccdd442f73976cfa79c21e6c9d1206468231b54b --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_3_mp_rank_05_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf1efa3ffe3e39c3b8c92f64b550c2db0bcae57de611eb211b73d1b1dae2603f +size 415502871 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_3_mp_rank_06_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_3_mp_rank_06_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e2a3e5737f5d277460a47030dfeee54c81c16bb --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_3_mp_rank_06_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:52fde3e8d43335ab3768b19c60c4e7fa89b8268b1b547d2a75ace9b9c6b3c590 +size 415502871 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_3_mp_rank_07_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_3_mp_rank_07_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..eca36aa827de677559fd55ef69a4355a182e2fb4 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_3_mp_rank_07_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:25891fe8ce7211caf58b988e2ec812bded97296eb79df11f2138d721acaa2088 +size 415502871 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_3_mp_rank_08_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_3_mp_rank_08_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5aab6fcf7afdfb7770033bb616a58b67ce6c2f55 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_3_mp_rank_08_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f538e398bfd80401d9ec6624cca61f071c93770c479c7d695f96eb5f0a6a6124 +size 415502871 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_3_mp_rank_09_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_3_mp_rank_09_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6bbcd43c7d1472e5e08366077f92c6bf4377e88a --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_3_mp_rank_09_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f2622f71f8016cf7c60c1b443f20f95d0266e3ea49dab92db6be3e06df1eb1d1 +size 415502871 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_3_mp_rank_10_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_3_mp_rank_10_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fa32534e8713f624287dc78b6704b14c38043747 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_3_mp_rank_10_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b00e1f3c5e0d5b8723bcb212f40f19ddc94925d4b1a703deef3bd5fc40601df +size 415502871 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_3_mp_rank_11_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_3_mp_rank_11_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1974f9b169233c99a79d5a3aa0e4c5e64ff1951b --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_3_mp_rank_11_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f93d28c311cf81de60d642ed20b452eedceb3fd6a5d7b9bfa291cb0c8d0c3146 +size 415502871 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_3_mp_rank_12_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_3_mp_rank_12_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..52e37da43bd5cc7d7bb45700f0e665c6031754b1 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_3_mp_rank_12_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f9acd278cb5609f3b68b1b33cac5efc5297219d7541f09ea99c83aa4c49a4a92 +size 385183895 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_3_mp_rank_13_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_3_mp_rank_13_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3e404e2054c212e930a4c6c4e44158bd159b23ec --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_3_mp_rank_13_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a50bd9f45288f920b7093424ef5bfaa60bef1980890092ef920d5092ee03c9f8 +size 385183895 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_3_mp_rank_14_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_3_mp_rank_14_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8839f03dc5d87dcd8e640b6c067360121bfdf23c --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_3_mp_rank_14_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76b6227a5348c97489d85011f38d6e75e14fd771104fbacdaeb6ed849eee52a2 +size 385183895 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_3_mp_rank_15_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_3_mp_rank_15_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4c3381bdedd80ad07d647a89859819079e441a82 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_3_mp_rank_15_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6946aaf8317f28dcb248c424d34af727b850d3163578d295a9711b34316cd2df +size 385183895 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d589ea2e3360e6c188abea9ca8edf7cdaddc9468 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:65f8c6fafd3097ca3cd8eac6d2c1222f64829c95b7220dfd85b41979bec4c4cc +size 460722647 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..54bc2c82f5d4d01f0e71bf462ad7057c7363f25c --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46d057403daaedf8d64bdd5eb8b4f5a7c538ff7f4997e04b1531b778978e0f6a +size 460722647 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_4_mp_rank_02_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_4_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bdfe4f5886eef4877899ce90eec8cacab982d740 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_4_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:efecbd2e05116db163de36e8ed2be3d9f0e02045659916ab009fb394c7a1edf5 +size 460722647 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_4_mp_rank_03_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_4_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..79871289f603d067f4c4967ccd0c5488e35d9e8d --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_4_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d25d7b6009f22a5a876f9ab8cc51ebd10c867c2e51a788705789bb999369d178 +size 460722647 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_4_mp_rank_04_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_4_mp_rank_04_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0211d5c51cb24ce5c0aab35cb046bac1a347c33e --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_4_mp_rank_04_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f4593d08d84a939b9ca4ee48f0416b2bb4698aaced63990dca79bd94e57f3cca +size 415502743 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_4_mp_rank_05_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_4_mp_rank_05_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..12a4c181367639f005c95bc80ff51b2f846e35e5 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_4_mp_rank_05_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e96cadde6406b25bdb52e8b1553423a2e850eedf567708e1b90c751b8359a77c +size 415502743 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_4_mp_rank_06_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_4_mp_rank_06_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..61452a6c1053fc7d7cdea2ee058dd9e2c0323dba --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_4_mp_rank_06_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:caf0de42c6d4c686f054523a1950026fd50c20695891b8e7fa1c4d73be92d71b +size 415502743 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_4_mp_rank_07_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_4_mp_rank_07_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..763692c79daa104a6f583f974de4f30ea2a1968e --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_4_mp_rank_07_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f36db8081eeffbce9ef7f628f0b6717bd37383e37a5b3007e3a838901074c56 +size 415502743 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_4_mp_rank_08_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_4_mp_rank_08_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f8b424af8e5492095e47224b737b5cefddab1663 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_4_mp_rank_08_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:88b113363034f5429d08ccf539946ff3d1eb68873410338a976a1445cef88af5 +size 415502743 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_4_mp_rank_09_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_4_mp_rank_09_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..51ea0159a5e66353f74a23110491bbd456c94a59 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_4_mp_rank_09_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51bbc6550ea3c5c711461c546e10c86e17a6885f48b1db6acfe8976c63f3027b +size 415502743 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_4_mp_rank_10_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_4_mp_rank_10_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b0347982da60d3c30c9419ae35653b3dffa2aa3e --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_4_mp_rank_10_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e467f3c397b59c15eb70f44039512c68eac8517291022ed96eff2c28a3ec4c3 +size 415502743 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_4_mp_rank_11_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_4_mp_rank_11_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d3a0305a13e5b99b8a4afff68fde1a4ffe2ac6c7 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_4_mp_rank_11_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3094f1401430fa039b436ffc5a48cc982988c42e16197aa7e554165f6ea20836 +size 415502743 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_4_mp_rank_12_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_4_mp_rank_12_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dc8facc7334e6b7ccd5f8fc58cbaffaf8692457f --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_4_mp_rank_12_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7fd5b5000879e0d7775737dbfd0e2ba239b6b24895ab4d79b6d18128df2c285d +size 385183767 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_4_mp_rank_13_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_4_mp_rank_13_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..de3531654a19f6c0e10f39bc88c9411500d32afb --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_4_mp_rank_13_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e1b6fe2d61410e635c106fa858edc8744145da8e8d67c662684137360a2d72dc +size 385183767 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_4_mp_rank_14_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_4_mp_rank_14_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..97ae4efcdc16e8bf6f90ce37a1e5853ffda4d64f --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_4_mp_rank_14_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5949d9c0e81ccc6287019ab5fcd254ef912ff46b6010bc686476b01dd8d7d288 +size 385183767 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_4_mp_rank_15_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_4_mp_rank_15_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4248a39caf28e6bf790a8171f790671834688e79 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_4_mp_rank_15_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77d7ebf554ccc3b5bda26962f672a3efd5e069ae11c4023c24354f165db36498 +size 385183767 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f0edcaadcd864b3a09eb3f5694138dd77f84601e --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c00f15f179dc1b619f576522966a9933da663f5db6b3eca6a9f2453d71248582 +size 460722711 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..05aea22dc92d04eb93164aaa4fd6a62d907ffd83 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e89d783a5355df122c70f959120da5a4b9a98df7297640e520255c3e035562a +size 460722711 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_5_mp_rank_02_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_5_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1176811d6a50ce79d58650ba51c1742d45d3cac2 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_5_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:326cb6b8b1acbdb6dd3378549b612ed81d0edbe051cd5b9cbaef94b8cb8fc779 +size 460722711 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_5_mp_rank_03_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_5_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e075be185fa020163d7ed005b10ebec7787736af --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_5_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ac0034b3c5378b3b8b6d9d84c0acc26f15861c60f11111f0ef2836880f49c72 +size 460722711 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_5_mp_rank_04_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_5_mp_rank_04_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f1d75df246e951462469abd056e655bba9786b3f --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_5_mp_rank_04_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e689deefa1caf62c09f1a27742e5caf54cb906c5a37c15398560052cc9d564ec +size 415502807 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_5_mp_rank_05_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_5_mp_rank_05_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f3da487024a0fed01f87c46246d4167435738fb0 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_5_mp_rank_05_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f9a01a2e60db21f4df87932bff2ee610aa06c54aaa4ef9c3d11831bf8b372c2e +size 415502807 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_5_mp_rank_06_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_5_mp_rank_06_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7593cf91dddab59dfa93ad8eb8e021c19b0548ea --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_5_mp_rank_06_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5324154f8add90e907636e41a7e9fb8a1c69c86ce6968821ddb400f798f665b1 +size 415502807 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_5_mp_rank_07_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_5_mp_rank_07_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..34d2811f2755b94779e4da4a2ae0c8fdffaf84df --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_5_mp_rank_07_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2cbb25a3bb5c6e7a759b561c8c8c6384f52d2cea3f1068f0d24891074e3f3188 +size 415502807 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_5_mp_rank_08_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_5_mp_rank_08_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..47c0681f77d60064b72cf049db32ab367ab0e7f7 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_5_mp_rank_08_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5233070533ea579643392c87a53e83d0bd71c69c10fef3d188748fe1cc76a366 +size 415502807 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_5_mp_rank_09_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_5_mp_rank_09_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d2d71169536232b8320fe25f4582246c44e8dc83 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_5_mp_rank_09_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:adb67439d0b2628ca42ca43a3a579900355b09b97835462e23519ce7db41376a +size 415502807 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_5_mp_rank_10_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_5_mp_rank_10_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d374ce3e33bb35508f59e5f3223f7db988aad851 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_5_mp_rank_10_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7979b7aee2e0d607e8cb7ebaae364edb6dcf24c4be9e9cbc6b00f7d3824a3727 +size 415502807 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_5_mp_rank_11_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_5_mp_rank_11_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..df0017d54f49e1dba78f7337e985dc1706de7d0a --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_5_mp_rank_11_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:079d49a5534c2e067d12eb54072d8e9f66f6ed0a2a590733fc99dbfeedb3ef59 +size 415502807 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_5_mp_rank_12_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_5_mp_rank_12_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..55539874070d2977ecf3faedbc300d08a0edcb6a --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_5_mp_rank_12_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c4c55da57be30117515bbb4c5dee070a33e58c736aecbdc6c989743cfb2fd32 +size 385183639 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_5_mp_rank_13_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_5_mp_rank_13_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..109840ce6c9c150073c001cbd4c67e33554f2b3c --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_5_mp_rank_13_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c8a7c44bb43c0edd8a646387fbd8c02633e1bd3113f7c9669ec693b47ea1a83 +size 385183639 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_5_mp_rank_14_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_5_mp_rank_14_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a42bcb77eee068b19cac94fd6537dbc75e9e026d --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_5_mp_rank_14_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a3567d34953e8bbe5b85283864775dd8a8733694f5d89a3ec8c3c7757c2f7ae7 +size 385183639 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_5_mp_rank_15_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_5_mp_rank_15_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d76f86df1feb642f87fca5c09b75f7e72750d3fb --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_5_mp_rank_15_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f26f999fef2acf910d968f36348a3dabdf2aced445dffe9196b23a972464cd57 +size 385183639 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..09eb2ad3c55094a4ae1839bda446e11cb65ce472 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a84b67d4eb2a0c15d3f673934d537c50cedeb6ead6fa2dfeddb245dc68830862 +size 460722775 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7058494ef66cb2347359f7c788504eee7c7e107b --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c328b99bc1a0e8059afcc5416c3fbbaaa1895e3308af88dc79021c2634c7e8c0 +size 460722775 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_6_mp_rank_02_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_6_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fab3a753f613551a3a4224c49baec2be53fcc2b0 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_6_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e11d7ba57a2cb09a42a3fe5bf64e8fdf92b3106318a312a687ad07c2b70aeb27 +size 460722775 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_6_mp_rank_03_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_6_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d59587ecd02f4346d29261be1681c0601ccb984e --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_6_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:283d4dac1455d80142f90cf4d40f4aa89fa8dce2116eeee534ca56771991f320 +size 460722775 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_6_mp_rank_04_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_6_mp_rank_04_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8180d1bcb76f67dc6b70afd39df2e2ed2559a450 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_6_mp_rank_04_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:07597a103481f4322906dad5675385fa298a7e0ba3bef80436ee33a62640c3fe +size 415502871 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_6_mp_rank_05_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_6_mp_rank_05_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b192cc7f1cc1b30fe5336b3cfb54b4aba483170e --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_6_mp_rank_05_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2eabd9a110a979dc475d8504c909f99d97270b9d433d760dd9707b7c525e2d52 +size 415502871 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_6_mp_rank_06_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_6_mp_rank_06_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3baaf9d2407aea8400b34210fc9be9bd5407d216 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_6_mp_rank_06_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d5485e0d6cfa28fd72331e12e7692421948ea63f00a0b5302c48c54e0d80a7e +size 415502871 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_6_mp_rank_07_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_6_mp_rank_07_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a3dc575274eaba6ea6d35902688fc801baa391b9 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_6_mp_rank_07_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3a06414977b37718bc9fd5473ce365d88c037c280c8e883f2eb3ab1e670be3d +size 415502871 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_6_mp_rank_08_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_6_mp_rank_08_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bae31b1429a6f9ba0cdecceebbdc14a0ee15c8a7 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_6_mp_rank_08_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1575fca7adc5c0a6a03a7d93c7b1afe1b21e1a99bc9cd1b8a225a8fe4b22c225 +size 415502871 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_6_mp_rank_09_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_6_mp_rank_09_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..29be4ed4a913f4bdc10af48a019c244b641fb268 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_6_mp_rank_09_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:802db3b8ae4fe85d3cc907f8f6871143f8f77cdc23af1757a54603f05c43e991 +size 415502871 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_6_mp_rank_10_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_6_mp_rank_10_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..83ffbb63bbcc7dbd0dfae2ece91b877c77da1e16 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_6_mp_rank_10_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:33129aee84b0cda7b1a233bf86756b7405c50ab53311cc41a23f7c464bd7426f +size 415502871 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_6_mp_rank_11_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_6_mp_rank_11_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8aea3bf113572f2690f299d59564e861251e6843 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_6_mp_rank_11_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a1cab0d16df1613c9d74b5e3e5e88f40fc00b7c85f8b5c365e3055883b938da9 +size 415502871 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_6_mp_rank_12_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_6_mp_rank_12_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5c5c56efabd5b86722c736c66a4eb0dc49257945 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_6_mp_rank_12_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:95d123f4b5ef641a265875d138d2dbfb6ba18f3daba2a9d8673f6a25b373a9af +size 385183703 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_6_mp_rank_13_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_6_mp_rank_13_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e304e1707edb9b7f82ce60aa1762f136646af64e --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_6_mp_rank_13_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f6bba932f567d101a847aeacb75ce21914a38ecf664dfcbb45a80faf706ff058 +size 385183703 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_6_mp_rank_14_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_6_mp_rank_14_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0442bcedb64f99e223a55cbdbc47dd359019bf49 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_6_mp_rank_14_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ec2bb097f5a400eca32c3c70a933a36eb21e1af2c6c6e9b81282d8da7e45fcb +size 385183703 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_6_mp_rank_15_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_6_mp_rank_15_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3cff609d8edd6e1a6b4d5103d2cd9e1257a0dc99 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_6_mp_rank_15_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f9e1f70b31ae8ffd84e7acdf1aa9296b5ba899d8c4ef808714dd478eb4450f71 +size 385183703 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d4fe3dcb0b9822d5f53dc4d23575368a8e7aca0a --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:350399120abb33bd541583c667f2137c3a27433b0bbafb9a6496ea761449eeaf +size 460722775 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..57a753597a21b125505843a03bf61fbbe3b698e5 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58e3715786494df60708cf70a8f1940758c63790648733b724bac199f4195f15 +size 460722775 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_7_mp_rank_02_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_7_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e0e267d73ae775663b4aeb1fc4cf1a232a5e2ff --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_7_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c4527b1f89aa2c9231229d48088ad45199388d63b48c4be39a3ffb7e8db9eb2a +size 460722775 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_7_mp_rank_03_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_7_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ac266fcba9c8ad8285865f225e50fd8fce8ff741 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_7_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d0f589a3ace282b4f46c8278e9be448d2ae468db96b07f6f61ad1f3982c451b +size 460722775 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_7_mp_rank_04_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_7_mp_rank_04_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b0cc64ebacede4c3aef768c3f71f0264c7db474c --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_7_mp_rank_04_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:894c78f731ddac6326be933e3e83a27d6e1ae8304c17191b3afda6f5abc89a63 +size 415502807 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_7_mp_rank_05_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_7_mp_rank_05_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bf398fde12c7969febe6a5aa4d25e7033c648fe1 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_7_mp_rank_05_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6cd784b28cb51db6cb40fb06b6efcbe56f0bb108f1c18c6766e798f670c88e44 +size 415502807 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_7_mp_rank_06_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_7_mp_rank_06_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5b05115b24e1c35ef9bc94eec0eb891e8e7fcc13 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_7_mp_rank_06_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6896d328cd43d78f122438786704d5663d57c2d85884fcf7b2f91af0f0e6ddbc +size 415502807 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_7_mp_rank_07_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_7_mp_rank_07_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..09420afeb6707c944fdd4d79ec9359438e451495 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_7_mp_rank_07_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9cbd8f15e4a45fb37d7db62c19408febc68a51c067e810fa23d04c4ddc67bb5 +size 415502807 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_7_mp_rank_08_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_7_mp_rank_08_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d26a17bd9c5e2859b2f43a5746a83ec481d7eab7 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_7_mp_rank_08_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a5fb8ceac354e0b43c0455c1024a243dee2e5a650e616e5c81cf5c9bb23d5f2 +size 415502807 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_7_mp_rank_09_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_7_mp_rank_09_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1b4a0a7c7aed64b50857b7b23c3b8a436802590b --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_7_mp_rank_09_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3fe68ee78576ba736fe9ffa62b636aaf710a4c98a306f43bfcfb55293c9b4bb1 +size 415502807 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_7_mp_rank_10_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_7_mp_rank_10_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e02b4d8a884e59e3db92b23d522da989acfd642f --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_7_mp_rank_10_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e040dc41a63c2b2205cf5be3a07a9a9d8e50d2a5a1154b619cc07531561ea28 +size 415502807 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_7_mp_rank_11_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_7_mp_rank_11_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6bb956773da5de0ce74b5fd722050d49b44d1ccb --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_7_mp_rank_11_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:635ecac16d691afda2498d15cda12267ad44fa143b02c9ee6481a034840f713a +size 415502807 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_7_mp_rank_12_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_7_mp_rank_12_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5e674fce9527c5ebe116429cb1eb2144c5820de3 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_7_mp_rank_12_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5154cd09cf0d3647e84496670c670c1df2d178337957d5057079242f24d26234 +size 385183767 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_7_mp_rank_13_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_7_mp_rank_13_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..79aea79aab0b3b74e7818dfd0675fd6b9730a0ca --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_7_mp_rank_13_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:396ba0e745dfe12c85569e5e7a0e9576751e258cc33b795a8c59c0502e7a26f9 +size 385183767 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_7_mp_rank_14_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_7_mp_rank_14_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2680439cbbff793d7a40a1132477d647884f6814 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_7_mp_rank_14_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b7558a95485170b60eb295dc54c7bc836c87c8420b27cea952f37593dc26786 +size 385183767 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_7_mp_rank_15_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_7_mp_rank_15_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dc0d0522f054bfd78ae3bf42ebb566e4882b1a7e --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_7_mp_rank_15_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b39182fc37b095809e8c69f234a39b8a80a343457a80b9573f327da9b2020b51 +size 385183767 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..86b5a360b64f70f534ba7e6836c7cbe91682f0bf --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d9ddf5214a6410f4b98859da19c58a0b5b3fe092692fd8a4b85dfdf71e655a1 +size 460722775 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b6d9f03d2d09420ea9d17a8259cff5b1546695a6 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:11d33acd4d49d7dd0a23a9f387f0ea45c1ea112170417ca955ae19b91abc432a +size 460722775 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_8_mp_rank_02_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_8_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7e1b9eb94ee7c61bedc9868bd7c32507a9dfe781 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_8_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f801654bcc024a4dedbeb1fc7f93b1c909038ffed549045f4841de76e0533d6 +size 460722775 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_8_mp_rank_03_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_8_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b1b9e8ff215b549f3ccf26449d5c5733eda559f3 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_8_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:25667605e85bc13eabb012c173c9743d6b20ac55e7102b0e09c507df7fcedf22 +size 460722775 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_8_mp_rank_04_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_8_mp_rank_04_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a024094c36505b77d26a388b91d75ddf78c097ef --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_8_mp_rank_04_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:33216a7cf32e08d50b56d216494b56c8328932c4bf469c4e0b09f4dc34018b51 +size 415502807 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_8_mp_rank_05_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_8_mp_rank_05_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..45163c828ba0a5b1eb8861a0a244441a4917987c --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_8_mp_rank_05_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6177b644bf83df19ea70255d2f5261d833a4495280b8866ff960dfb0244d33c0 +size 415502807 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_8_mp_rank_06_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_8_mp_rank_06_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6c9c1e86df45808714796e60f91c221e6a5e02b2 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_8_mp_rank_06_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eae6660c94447a5b7e2f9ab37f3f653346c273e3b1bcf46eb43c2ffc1eacad0c +size 415502807 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_8_mp_rank_07_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_8_mp_rank_07_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..caf724743f55a93e23f658e9d22015d8774c6220 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_8_mp_rank_07_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b0147f59f8ceaeec59ac30b095a21930bdce343645712a43e52280d826089c86 +size 415502807 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_8_mp_rank_08_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_8_mp_rank_08_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0adbd5f50a91f4314973b3c68162dd059ad41b37 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_8_mp_rank_08_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c46bb69f8cad06a10835c34f38bea65c6afb76081e1451966931e22b2fba87aa +size 415502807 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_8_mp_rank_09_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_8_mp_rank_09_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..59e1f41e91656f08fd48ff836dda7b9744b9fa3b --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_8_mp_rank_09_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9581a2e27d93f8c8a64bed53f6b680f15395a6622e5df52ae52f39a1c9b95806 +size 415502807 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_8_mp_rank_10_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_8_mp_rank_10_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7b213cb9d5e522471d6882f7e7ec91134da12058 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_8_mp_rank_10_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:26bb49dca97c02f8b2e38104f52e96b9eedf031302b4d0c8f01ac406db76f8b8 +size 415502807 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_8_mp_rank_11_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_8_mp_rank_11_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..990cbdb6e97d0098be021b00be35b887646d7719 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_8_mp_rank_11_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1441fcce49f49e4f2975bc9a7a97bd294de6060541561495a8257e4b0d3a1ee6 +size 415502807 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_8_mp_rank_12_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_8_mp_rank_12_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e3a0ab9b0ee73637f31ec94d8e83794e01ac6a8 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_8_mp_rank_12_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:acca497b4d937ff17af6385c7f62e84b0becb11e939e6b87733bfdab72809df2 +size 385183639 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_8_mp_rank_13_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_8_mp_rank_13_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d0020cb472393c4d21ef476d00ceab728998e6b0 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_8_mp_rank_13_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d604d24d24e3ceb9b260a5479e69f0015455c33ac2036600b644b6cca74cb9ad +size 385183639 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_8_mp_rank_14_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_8_mp_rank_14_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dcaf9fadaf6b8e278daf38b63e582ea7edffbbf3 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_8_mp_rank_14_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:796b4bd5d71a48f14b4caa2ae1004819275ad15071f650b92a262876b778b665 +size 385183639 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_8_mp_rank_15_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_8_mp_rank_15_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..aa048f2fbc20bd36f123c3adb9593aa691f33a0a --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_8_mp_rank_15_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc1c58c785e886a7f695bcc7cdf774d735182f5421b5d24e55f5df6580293557 +size 385183639 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2559dfed4c545517921143a9d07497ca9f205577 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2368958d0fa6f5960caa5ce2b66261f940d87c76ef40246b2eeb963cf992c3d4 +size 460722711 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..09fb47f5d0631244c53aaa7e9ba8cd9b648e7195 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f864164aa165f0266fa04cc5351b92f80ab9bea0a8dba4044afa7c9a3d05ed8 +size 460722711 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_9_mp_rank_02_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_9_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..eb93abe444098074248dfc4c5085175f4197bde4 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_9_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a1938dc3cd72c5d989387d977474a393fc65bb0e3dc0147a9b112f8d8ac7d35 +size 460722711 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_9_mp_rank_03_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_9_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c997a633933e78d39453aea38b34aef71f1c9226 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_9_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:544e4bda5b65607e389aad073c2fb7d66e62183eda67a2e6558faa98808eecee +size 460722711 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_9_mp_rank_04_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_9_mp_rank_04_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a368ce5b0c08ef9edd0fa13a7f3244e25cd55634 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_9_mp_rank_04_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6be674abc7d9b01e8610bc5737ca8f83cda63956cbefec67bf0ef81710a489c9 +size 415502871 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_9_mp_rank_05_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_9_mp_rank_05_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bb4ec0ad8754ae94a0b66b7b72e218c05fecd0d1 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_9_mp_rank_05_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:43f367b5dae7a186073569f3eb986d37dc29db21a8e68a25f0d54e7967225b2a +size 415502871 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_9_mp_rank_06_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_9_mp_rank_06_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0d0711b2ceb9a0b4e1c15c8ec90f4e98aa651ae4 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_9_mp_rank_06_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:997d7172638fdc2ef33ae600bd7ea5d929de114e628af9ff545ae31ca5edde7e +size 415502871 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_9_mp_rank_07_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_9_mp_rank_07_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ec9c9f53771b648e21e00fbf6d2957200af17bcf --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_9_mp_rank_07_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:44814729fbc7d8389984b4b38d9f624081780e2606044ad17d4cdaaa8e27dfc4 +size 415502871 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_9_mp_rank_08_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_9_mp_rank_08_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8bb38ca7eb00690b20dfad61f70ab96c3c6e97fe --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_9_mp_rank_08_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:67ce19af74a47351192dd7caa769cd88fc1d0e564a464817e123697ec94e2070 +size 415502871 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_9_mp_rank_09_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_9_mp_rank_09_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..02f2a09bedebbb506b92a410e7b66156fc2b75ae --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_9_mp_rank_09_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be9d97484816b7eb76abff293a4de8b4b5201542c387ad4bb46a88e94cee266b +size 415502871 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_9_mp_rank_10_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_9_mp_rank_10_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..744e97617a63aa954ff9a0b606f5d9d1a27ab932 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_9_mp_rank_10_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:54388564bd0b9bb547ea230bd58b719c4bc7ee773d75e2f9a7fb666d00825205 +size 415502871 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_9_mp_rank_11_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_9_mp_rank_11_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e009f00ededdf618aad1ad6d4fb3acdecb06e74b --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_9_mp_rank_11_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea3f4f2e64fc6fd8fb681db39fa27867a830c0ebe24add67f0410092cf87d168 +size 415502871 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_9_mp_rank_12_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_9_mp_rank_12_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b8ee811d2fefa3b4829f156a08c1f8867b3b133d --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_9_mp_rank_12_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46161922be9da5eb1f9dd7d5c43671bc049c84d1ce34d70ffd9f7cbc29a9d155 +size 385183767 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_9_mp_rank_13_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_9_mp_rank_13_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8efdd6c09827a9f9ef74a90f5d381e6007fd9168 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_9_mp_rank_13_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f502c5b793c6bd45bfce34a1b869042df5b656a7f7b4b043b26cfc30892e7e1d +size 385183767 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_9_mp_rank_14_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_9_mp_rank_14_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..93f83c1f8eb51d7958aa04d1d17916b216eb2f83 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_9_mp_rank_14_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d055f86e15fdccc2c8742eeb2d904e6e92134c804769d54c9ae67bade69af26 +size 385183767 diff --git a/8b7178b13b/global_step84877/bf16_zero_pp_rank_9_mp_rank_15_optim_states.pt b/8b7178b13b/global_step84877/bf16_zero_pp_rank_9_mp_rank_15_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..74e5b5d07cd75222f534cc8d2cc6b229ca2542c6 --- /dev/null +++ b/8b7178b13b/global_step84877/bf16_zero_pp_rank_9_mp_rank_15_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:61b8297b20c4a6252fac6ee4de75f0d01b88b9f5164d3cfc7f11216283216516 +size 385183767 diff --git a/8b7178b13b/global_step84877/layer_01-model_00-model_states.pt b/8b7178b13b/global_step84877/layer_01-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b1426bf50e0ca0f0f5adf049320b990c2d782b9d --- /dev/null +++ b/8b7178b13b/global_step84877/layer_01-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c3e11cf75b9d2e6b57adf2f35dfba47d328805237c0ad8117b83cd36a545b26 +size 120587523 diff --git a/8b7178b13b/global_step84877/layer_01-model_01-model_states.pt b/8b7178b13b/global_step84877/layer_01-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8b844d40b9106f7dd455c9cfcc6374b949388f44 --- /dev/null +++ b/8b7178b13b/global_step84877/layer_01-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2699c8ae00b3f5957aa43ce9d38a7adc67e3aa94505b7bdb5c73c7fd266e239e +size 120587523 diff --git a/8b7178b13b/global_step84877/layer_01-model_02-model_states.pt b/8b7178b13b/global_step84877/layer_01-model_02-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ba3300024b0c2b26c65ca732d8b66723a83268b9 --- /dev/null +++ b/8b7178b13b/global_step84877/layer_01-model_02-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a3c0f6e02cf946bb85151794028b21b04919a93c89c93860b7f2eceefce88dd +size 120587523 diff --git a/8b7178b13b/global_step84877/layer_01-model_03-model_states.pt b/8b7178b13b/global_step84877/layer_01-model_03-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..71119f8d7ac3bc3998270febcb1530a73b52c6f2 --- /dev/null +++ b/8b7178b13b/global_step84877/layer_01-model_03-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f5bf4984caf907da820421ab49041e03cd9936eef86bb0184604be4b64ba4316 +size 120587523 diff --git a/8b7178b13b/global_step84877/layer_03-model_00-model_states.pt b/8b7178b13b/global_step84877/layer_03-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4a47f39bf377e30554cb9431a808bb7cfddb5859 --- /dev/null +++ b/8b7178b13b/global_step84877/layer_03-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3aed0cca86260b74bd76361f38dfcfb9ce69a7074d3c2499db1d6adbc5eab12a +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_03-model_01-model_states.pt b/8b7178b13b/global_step84877/layer_03-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2370b012a44e5a30a7caa016cc9dc30d73ff6de1 --- /dev/null +++ b/8b7178b13b/global_step84877/layer_03-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c13a3d3cb7d55809891475c03087138ebcc9c840692df24cb4ceaf9bcd05661 +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_03-model_02-model_states.pt b/8b7178b13b/global_step84877/layer_03-model_02-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f4d3b3432e753d9c20754c6acc9f3a877f973c81 --- /dev/null +++ b/8b7178b13b/global_step84877/layer_03-model_02-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f67a524c15cf7bf56f488b19cdf696269bf2e4cb8250e43d7e83600a63b6751 +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_03-model_03-model_states.pt b/8b7178b13b/global_step84877/layer_03-model_03-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..08d1864899279a08c6665d6b135d20dd6d92c79c --- /dev/null +++ b/8b7178b13b/global_step84877/layer_03-model_03-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a1e7a6f8843927eaf1f3fbed5b842ec779f979e1711e40f77874fb576eed16d +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_04-model_00-model_states.pt b/8b7178b13b/global_step84877/layer_04-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fa8ee616eddab2896358925eff36a0052bbaf2b3 --- /dev/null +++ b/8b7178b13b/global_step84877/layer_04-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d5e0f6ba57aea173d7448802a088b16fbc5f832d6e0e43fb3f40a0a1f6afe3cd +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_04-model_01-model_states.pt b/8b7178b13b/global_step84877/layer_04-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..011a8d47063c50be9e64fb9cfa74d1dd9e863e95 --- /dev/null +++ b/8b7178b13b/global_step84877/layer_04-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c1eee9c10ca0e8d5ebd42772bc58f9c100a7d54d94581b47c0f2a23eda68fa2 +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_04-model_02-model_states.pt b/8b7178b13b/global_step84877/layer_04-model_02-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8b8db6bbf53f8d3e9c834e7a6694e61ff086bef7 --- /dev/null +++ b/8b7178b13b/global_step84877/layer_04-model_02-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ffca2d63432a29c160cea3d79227b6fbba2dc8520b141f1f57ce2bd9eb4c9a69 +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_04-model_03-model_states.pt b/8b7178b13b/global_step84877/layer_04-model_03-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..391fababc9654c46617ec6d05d2a704fd4134033 --- /dev/null +++ b/8b7178b13b/global_step84877/layer_04-model_03-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7df49c1b7dfce41d00673acb937375330ce50752fcd3cf6071d79f174472e5a +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_05-model_00-model_states.pt b/8b7178b13b/global_step84877/layer_05-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9f82bf850d5114241bbd5e66f185ac8d65396902 --- /dev/null +++ b/8b7178b13b/global_step84877/layer_05-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb795fda669d4ef1faa0cc77c7922e3447c4904f45a5ed40690617de87d38d2d +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_05-model_01-model_states.pt b/8b7178b13b/global_step84877/layer_05-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5d834ba65aa8919165688157fbec8080e5ddc234 --- /dev/null +++ b/8b7178b13b/global_step84877/layer_05-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ddddf103c770941da288aac2fd9a22b7ff02867b7683e443c7f5a2f86c200880 +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_05-model_02-model_states.pt b/8b7178b13b/global_step84877/layer_05-model_02-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f8618b3507007b17c8c0d2bebd292adb1b7a02a2 --- /dev/null +++ b/8b7178b13b/global_step84877/layer_05-model_02-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8cfb7c1a8a93217f869ee6382ffb9308527265adb533146f6a2b025411fd2f70 +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_05-model_03-model_states.pt b/8b7178b13b/global_step84877/layer_05-model_03-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6bd6cb711ff68464277df02bdfe99ba67bf318e0 --- /dev/null +++ b/8b7178b13b/global_step84877/layer_05-model_03-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b315a00098b2dad40b8911b2f66cb7fabed8d399f8d992789e7ec694f7d2e62 +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_06-model_00-model_states.pt b/8b7178b13b/global_step84877/layer_06-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..47c1b392502586086e354e95e2b2ddd6e6429983 --- /dev/null +++ b/8b7178b13b/global_step84877/layer_06-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:69a8cf111812982856d454bc6da813dbb79aab192dc39c6641611bef0d555a1d +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_06-model_01-model_states.pt b/8b7178b13b/global_step84877/layer_06-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..feef11716169be9394b65333c594adcca1f0ef44 --- /dev/null +++ b/8b7178b13b/global_step84877/layer_06-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e9e8036753e15bd0e305c109509ecbf68836062cd372a4827f32e48fd28a2ce +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_06-model_02-model_states.pt b/8b7178b13b/global_step84877/layer_06-model_02-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a14740c7e197ae4c7f1f926ba04b04e3c3b723b0 --- /dev/null +++ b/8b7178b13b/global_step84877/layer_06-model_02-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:075b757d13954c0e51a06164b6f6145454cbc3c8a1ecfdaa05a560b3d32d2513 +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_06-model_03-model_states.pt b/8b7178b13b/global_step84877/layer_06-model_03-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5f2b6d2b988a324c395edf0118c044d9bb01898b --- /dev/null +++ b/8b7178b13b/global_step84877/layer_06-model_03-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a141a0600c97a1f069f09980bbe5f0ad929c3c543c8d433c153941bb24b74046 +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_07-model_00-model_states.pt b/8b7178b13b/global_step84877/layer_07-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0eb6480b31a98fbcf2eb5852f5d28e6e8cf17fa3 --- /dev/null +++ b/8b7178b13b/global_step84877/layer_07-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bff91a9dd23680579680bb52a11a03e40601310e3aa561466b58ede8dfdb9852 +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_07-model_01-model_states.pt b/8b7178b13b/global_step84877/layer_07-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8b049c1e98fecf8c9cb6513b137a88152cee8b08 --- /dev/null +++ b/8b7178b13b/global_step84877/layer_07-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a3b3fb46da24b305f51247c9d84721cb168d680dc703abe939bc6cc41a096b72 +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_07-model_02-model_states.pt b/8b7178b13b/global_step84877/layer_07-model_02-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..42c452909fe08ed64875f1dafaed45360dbc277a --- /dev/null +++ b/8b7178b13b/global_step84877/layer_07-model_02-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:693a1db1c503f21779b6544bae5fa81cdd8b3a957f030875bf4c2706fe5c7894 +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_07-model_03-model_states.pt b/8b7178b13b/global_step84877/layer_07-model_03-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..eb6577bcda2f567f0e2834313d476193e16002fd --- /dev/null +++ b/8b7178b13b/global_step84877/layer_07-model_03-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06376c7aab2abab3ba1d14bba47f609ace458f29fa548bbc11ca17d2809f2f35 +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_08-model_00-model_states.pt b/8b7178b13b/global_step84877/layer_08-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..02be434eb81b745d2825f0526f1154b213511cca --- /dev/null +++ b/8b7178b13b/global_step84877/layer_08-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0bd00145fa731c95ee5f47b47ae0608b9218a024fc648f6e98bf19abf66aa19 +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_08-model_01-model_states.pt b/8b7178b13b/global_step84877/layer_08-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cefd410ce6fc885ee0764c786992ff6ef7236496 --- /dev/null +++ b/8b7178b13b/global_step84877/layer_08-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:941d2e2e73ad206f24b9385c17a4a6fd88ed06ead5b56f200623a2998ea7c2cd +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_08-model_02-model_states.pt b/8b7178b13b/global_step84877/layer_08-model_02-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1aeea0dc3ec0b6e4b9b78c6547c4c18a7a33d440 --- /dev/null +++ b/8b7178b13b/global_step84877/layer_08-model_02-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eab61e0fe258741d493d6c2f46dffdf43f6aeb385e17e7118719bd6fe1f2eb6e +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_08-model_03-model_states.pt b/8b7178b13b/global_step84877/layer_08-model_03-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0035a588c2fe936a0aa5ada6ff6884c786f3ed48 --- /dev/null +++ b/8b7178b13b/global_step84877/layer_08-model_03-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d581b389e05cf541a007cb64a2d660a3ea04164249fea71fc7ef2eafbaa7643f +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_09-model_00-model_states.pt b/8b7178b13b/global_step84877/layer_09-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..272290f236728b6788186e05c4e214a105a9be7d --- /dev/null +++ b/8b7178b13b/global_step84877/layer_09-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:07182c0624d54b59689e7920875da2eb2dbeeea70ca28f50f93d1bf2b2420e02 +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_09-model_01-model_states.pt b/8b7178b13b/global_step84877/layer_09-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8a3f6bdb224cf164009855c3284b128cf3bb36d4 --- /dev/null +++ b/8b7178b13b/global_step84877/layer_09-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ae2fc31ecd454ebdd06ff3d501bdd9cd6ce49b8fe71efb9345b3fe4df136a88 +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_09-model_02-model_states.pt b/8b7178b13b/global_step84877/layer_09-model_02-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..214d25cb0cc4ab6c9afa65d79696db9f7bcf452b --- /dev/null +++ b/8b7178b13b/global_step84877/layer_09-model_02-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d5e575d633fd39cdefc9144dfc4eed3ae600a2b3afa3af8e63ef63fa0e9e8ef2 +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_09-model_03-model_states.pt b/8b7178b13b/global_step84877/layer_09-model_03-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e540809950225cbb98ae7e88120ecec8a0bd632f --- /dev/null +++ b/8b7178b13b/global_step84877/layer_09-model_03-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f818461441b2344508a2907c9966e6f3099f5c7fa1edc535b7b01b13888a8240 +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_10-model_00-model_states.pt b/8b7178b13b/global_step84877/layer_10-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5887693078afe6f61f71010f99e4cbe1f28f015e --- /dev/null +++ b/8b7178b13b/global_step84877/layer_10-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de76ef7a9180571c095deb12fdc5f24f4d105fa116da7b5411d5dc12ecf7fff8 +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_10-model_01-model_states.pt b/8b7178b13b/global_step84877/layer_10-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cf78cf63809ec706ae08b2c114a4c7edd36dda69 --- /dev/null +++ b/8b7178b13b/global_step84877/layer_10-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97e3271f0587d92138cd55945ddc3a660f38f02c0c2dd143e592bd928cfcf5a8 +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_10-model_02-model_states.pt b/8b7178b13b/global_step84877/layer_10-model_02-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bb8a3b14efa217a6135d2233bcb6b6ea4bc73a72 --- /dev/null +++ b/8b7178b13b/global_step84877/layer_10-model_02-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b93f0640aafe89bade2469835649bb31d70ca7da2b58f90a773ec9e718372b83 +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_10-model_03-model_states.pt b/8b7178b13b/global_step84877/layer_10-model_03-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bd944281b58f4680325e9301fe4e5d69a14ba122 --- /dev/null +++ b/8b7178b13b/global_step84877/layer_10-model_03-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9a04c0cad77eb6306e30d6dbfca9c2c49de40e33b2b9cf63e65fb22de533b0e +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_11-model_00-model_states.pt b/8b7178b13b/global_step84877/layer_11-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..584159f6179ee40266e76ccca457e8697426af0b --- /dev/null +++ b/8b7178b13b/global_step84877/layer_11-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b1810345f30d7f4f7c00980a2119e755257584a418dfa4dc8c3c2901950be408 +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_11-model_01-model_states.pt b/8b7178b13b/global_step84877/layer_11-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cc348513df202667b95a5b126d5cbe65f994edd0 --- /dev/null +++ b/8b7178b13b/global_step84877/layer_11-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f92f283511ca56fb8f99b8d7993135277fe124aac835690b91edbc3af43eea1 +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_11-model_02-model_states.pt b/8b7178b13b/global_step84877/layer_11-model_02-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cc289f31e39408b121f6814a0a03d317f7d33831 --- /dev/null +++ b/8b7178b13b/global_step84877/layer_11-model_02-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b2b79e21a447f17418fa425d9836df964388d768886d066b6c6f15965b7ba6eb +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_11-model_03-model_states.pt b/8b7178b13b/global_step84877/layer_11-model_03-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5374237ca0d400c249b2c9f5073d0849ac13d448 --- /dev/null +++ b/8b7178b13b/global_step84877/layer_11-model_03-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:65681df413234e3f48b8f36078d2d0633086b3cd65f72ba18d42e9f3fd2acd8c +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_12-model_00-model_states.pt b/8b7178b13b/global_step84877/layer_12-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e2292b6681b5266ddaa88005be40413ee9b864e9 --- /dev/null +++ b/8b7178b13b/global_step84877/layer_12-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:69fccab9c1b56973f65176540e72276e943b2a8bb2c9395f4ce4e2a6a76171f8 +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_12-model_01-model_states.pt b/8b7178b13b/global_step84877/layer_12-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4ce5b0eb0459b8117423145bfdebe0a02b85fb91 --- /dev/null +++ b/8b7178b13b/global_step84877/layer_12-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b676dc79f0915f7fb839146298fe0b2df7bd7ca413af0b4a3f1ac8ad96e3291 +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_12-model_02-model_states.pt b/8b7178b13b/global_step84877/layer_12-model_02-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..69c8d87f131e3c38a9752335668a03e91b203881 --- /dev/null +++ b/8b7178b13b/global_step84877/layer_12-model_02-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec2a093a7c34e90c0cf664f7f898408042cc041332bfc77c97c60ff1052323de +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_12-model_03-model_states.pt b/8b7178b13b/global_step84877/layer_12-model_03-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..56229eccbffbdcae95ca52d5beb6597ce0cc6d54 --- /dev/null +++ b/8b7178b13b/global_step84877/layer_12-model_03-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c6f1fc33bafb9e61e74a924cfa25a49c14db0e9b8dc43dd6004eb278b8a5f69 +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_13-model_00-model_states.pt b/8b7178b13b/global_step84877/layer_13-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5f408d990e3a539bfd66619f0caff91ef9631fb2 --- /dev/null +++ b/8b7178b13b/global_step84877/layer_13-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cfb0dab0661aa30801e5b7ad8971f31993bdc35f2250706615afcfe8c1d1880d +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_13-model_01-model_states.pt b/8b7178b13b/global_step84877/layer_13-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7f0fa2a4a647b09037e672bd59b971312643cced --- /dev/null +++ b/8b7178b13b/global_step84877/layer_13-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b7d4f0a2047264b5c87d067ef493ca18cbcce2636cde8a8af629eb7411f5ab80 +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_13-model_02-model_states.pt b/8b7178b13b/global_step84877/layer_13-model_02-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8550dbdc706854516d86bbd8fd70cc083e8dfc7f --- /dev/null +++ b/8b7178b13b/global_step84877/layer_13-model_02-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:403ef40ecfdc92a176a1b093a3f415dad773aa30f1d7306b6686b0beb2c51e17 +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_13-model_03-model_states.pt b/8b7178b13b/global_step84877/layer_13-model_03-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..96da68d392e408162ef9c9cd8c81a407f7cfdbaa --- /dev/null +++ b/8b7178b13b/global_step84877/layer_13-model_03-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a4301f6b6b616dd5d0c28ff8c054c8fe0aa310d751bcdafbd40e3366401f9f72 +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_14-model_00-model_states.pt b/8b7178b13b/global_step84877/layer_14-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ff458c7f45c2ff9475b5fc6d91389ddef55417aa --- /dev/null +++ b/8b7178b13b/global_step84877/layer_14-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cfa6225f83319aef692a5683cd89979192e50f637d93cac1e928e83bb5c52886 +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_14-model_01-model_states.pt b/8b7178b13b/global_step84877/layer_14-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dc93cbad1b421181459078a0caebbc30a1b35394 --- /dev/null +++ b/8b7178b13b/global_step84877/layer_14-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ec5038d0ec52affdea3a249957ce4bb1658b2f90129f400558d4a663b294d4e +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_14-model_02-model_states.pt b/8b7178b13b/global_step84877/layer_14-model_02-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fbc25e7c066a12ee49226b94dc2ae7e910e96405 --- /dev/null +++ b/8b7178b13b/global_step84877/layer_14-model_02-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f9922e0b4e13428b7aa86462478d3a12a2d4879edcc811c5ed3c486b0e6c6fc +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_14-model_03-model_states.pt b/8b7178b13b/global_step84877/layer_14-model_03-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4eb1b111858c16243d710824bd1f1f9dad70b427 --- /dev/null +++ b/8b7178b13b/global_step84877/layer_14-model_03-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b6814d630771f483b158a54ebdc0d56a3db4fb12b248e37aaa91db8f304eef40 +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_15-model_00-model_states.pt b/8b7178b13b/global_step84877/layer_15-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a23f1ee11c5e31d8376d3f6d269c21ec6f82bc72 --- /dev/null +++ b/8b7178b13b/global_step84877/layer_15-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ecf736f6087a15dff88643fefb6f0036599418c67ab1edd01cd2ab5ac4702f92 +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_15-model_01-model_states.pt b/8b7178b13b/global_step84877/layer_15-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e774d8db8640b3c9457620b29a738c0df8797b7a --- /dev/null +++ b/8b7178b13b/global_step84877/layer_15-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10643e68f3c320c0fcc3a46a14fc88d19f9c8c2c88b01484556230b9c27b4bb2 +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_15-model_02-model_states.pt b/8b7178b13b/global_step84877/layer_15-model_02-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d0a1fca8d8975568e845274113fb39394e6ff718 --- /dev/null +++ b/8b7178b13b/global_step84877/layer_15-model_02-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e4b9e8f4ac725cef57d83013ee24560b5c5b6b79876645cca92ce089a1a483c2 +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_15-model_03-model_states.pt b/8b7178b13b/global_step84877/layer_15-model_03-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..09fde34900b8f2285c1e8c6f1ac121869cd1cfec --- /dev/null +++ b/8b7178b13b/global_step84877/layer_15-model_03-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d0c877bec9428c105b8bd6a671bff95f6d847e1f3bd4abeb714835f8792712e +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_16-model_00-model_states.pt b/8b7178b13b/global_step84877/layer_16-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f83df96b949363655f30eafaafaf610d5963e3c7 --- /dev/null +++ b/8b7178b13b/global_step84877/layer_16-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fad84f90334befd29a100f5246ea7a889b90210489986f4495178a5153dc3d94 +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_16-model_01-model_states.pt b/8b7178b13b/global_step84877/layer_16-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..46587c16eddff473c3af67be280ef954c64b8782 --- /dev/null +++ b/8b7178b13b/global_step84877/layer_16-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c4668a6dca7b99214ee14d8bd4f7c594f7806cb58d7aa6a61f48f8da2b9c9c6 +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_16-model_02-model_states.pt b/8b7178b13b/global_step84877/layer_16-model_02-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3d10e97aa3271ae2fd182aced8947c28d482f41a --- /dev/null +++ b/8b7178b13b/global_step84877/layer_16-model_02-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1964ced487f8cc3624968113f428b2623f3cf0843dfc066e32a040fd4698244a +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_16-model_03-model_states.pt b/8b7178b13b/global_step84877/layer_16-model_03-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3b5c3dc44bcb2840c42e644d45748de155ce43cc --- /dev/null +++ b/8b7178b13b/global_step84877/layer_16-model_03-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4cfb8b1cbed15c958f94f28006c14f25a22d3c7e885daa5dd18caeb5ce54d908 +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_17-model_00-model_states.pt b/8b7178b13b/global_step84877/layer_17-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0202cce17b4d88f0981fa0a811519e91319b8b06 --- /dev/null +++ b/8b7178b13b/global_step84877/layer_17-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:168780f9fd9fe803b45a922102bd73229767edbadd3feac7266de16f0645f83a +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_17-model_01-model_states.pt b/8b7178b13b/global_step84877/layer_17-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b656bbacc405dbb9a956d3b11fe31d6e90d8c51d --- /dev/null +++ b/8b7178b13b/global_step84877/layer_17-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2690e2020977db7fdb86536116e56f61132cbbb660a274cb5103441e74923b62 +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_17-model_02-model_states.pt b/8b7178b13b/global_step84877/layer_17-model_02-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bb4ab6adef9755568ce6cf08bf772fff4ba002bb --- /dev/null +++ b/8b7178b13b/global_step84877/layer_17-model_02-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:57c8dde5f21f8935ba4005bc36118514d2f5746eef83519c6bbac0345c4b2a1b +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_17-model_03-model_states.pt b/8b7178b13b/global_step84877/layer_17-model_03-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5cea4bc54640fc21483da8f47d9a64e9af8fa7a0 --- /dev/null +++ b/8b7178b13b/global_step84877/layer_17-model_03-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d74a7c849d56138a5f6a5d557e036eb3fa7987e164981a8537be4daecf2d9c4a +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_18-model_00-model_states.pt b/8b7178b13b/global_step84877/layer_18-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e45195bf16b976fedadf592639222e787269aff3 --- /dev/null +++ b/8b7178b13b/global_step84877/layer_18-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f2cda7c262b2334f67ab55c0ac733ae0b3ac3e9f0d17c85dc128918d0473ee28 +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_18-model_01-model_states.pt b/8b7178b13b/global_step84877/layer_18-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d98da1f535bf79e56235667cdb0f82e43d81f98b --- /dev/null +++ b/8b7178b13b/global_step84877/layer_18-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d91061119fef8fa6b98ac1045898775fff11eb90184528935d0b05865d0424d9 +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_18-model_02-model_states.pt b/8b7178b13b/global_step84877/layer_18-model_02-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b6c44f8c454c0eca9b3f5dc5b36b42706d410d0e --- /dev/null +++ b/8b7178b13b/global_step84877/layer_18-model_02-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6053da4ca6e2bbed9664edf5715868fa4865d4369434da8353322972c5deba29 +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_18-model_03-model_states.pt b/8b7178b13b/global_step84877/layer_18-model_03-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..322d105576497d278227776dac8e0b60e1c0e19b --- /dev/null +++ b/8b7178b13b/global_step84877/layer_18-model_03-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4302eca37e857fd75c4f91cd8fd0226e0cf2964b513c7cf4b2e42d9f5c94b2ab +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_19-model_00-model_states.pt b/8b7178b13b/global_step84877/layer_19-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..63cb90e8d7ff1f4fa32226ffc2fab5b9dcdbcc1e --- /dev/null +++ b/8b7178b13b/global_step84877/layer_19-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d1b86cd51c82994faac43480c1b139eded8e00b2e4d1e249f240fdf9a874c48 +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_19-model_01-model_states.pt b/8b7178b13b/global_step84877/layer_19-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6a0590355a2b4ed0e30fc5cd835b1961f7250c4e --- /dev/null +++ b/8b7178b13b/global_step84877/layer_19-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b3cd0960d3c1574827ecd707ada7f0eb4120bb901a46f307c4c68e87e43ed25 +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_19-model_02-model_states.pt b/8b7178b13b/global_step84877/layer_19-model_02-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a1595b3cbcd4f56d1341285d3891a86527ce964d --- /dev/null +++ b/8b7178b13b/global_step84877/layer_19-model_02-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:33d611cfaace34a0cdd1387e21a2d84497f2e4af2ba2cd6cf6ce91adbdd08743 +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_19-model_03-model_states.pt b/8b7178b13b/global_step84877/layer_19-model_03-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bdb57094e1ef11ac9ae63ec0b83e7408c99859dd --- /dev/null +++ b/8b7178b13b/global_step84877/layer_19-model_03-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a1499a39b35f3654508a9b82fac5715f7d5a451a94d0b75c8f6a6c77edcce1f1 +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_20-model_00-model_states.pt b/8b7178b13b/global_step84877/layer_20-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7e4d678bf13a8d1882d288534c2a4b1a68a26574 --- /dev/null +++ b/8b7178b13b/global_step84877/layer_20-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c41fdc36f4612eca2eee442d60b8c372f9096ab15c249349c03c5b96971b8df +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_20-model_01-model_states.pt b/8b7178b13b/global_step84877/layer_20-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2d19851d85d0bf925a0effeb2b085da174cfe360 --- /dev/null +++ b/8b7178b13b/global_step84877/layer_20-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34f4d2dd4f59fd2e23e9600421f2390952fb66a6d1dbeb791765d47208447578 +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_20-model_02-model_states.pt b/8b7178b13b/global_step84877/layer_20-model_02-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cedaba388eefc7674bbc697b7f9ad0c6cdebcb2e --- /dev/null +++ b/8b7178b13b/global_step84877/layer_20-model_02-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e9aba191931451acde78a8565a43ae5612862f1cd5d7eb5ff88cdc2978fbabf8 +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_20-model_03-model_states.pt b/8b7178b13b/global_step84877/layer_20-model_03-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ee9b5777000e2188f128fb671698e51a40f82339 --- /dev/null +++ b/8b7178b13b/global_step84877/layer_20-model_03-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d41cebdb68b41b1a8c9fb9dbf8fa5659efa23d20067f3accaaa54006e8665069 +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_21-model_00-model_states.pt b/8b7178b13b/global_step84877/layer_21-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7faea8ca60eb42a9d1d47b7f7441c3f3c620fbdc --- /dev/null +++ b/8b7178b13b/global_step84877/layer_21-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:56db62ac3b3e877ba9a5b2fdcd2588cd8a7628b16b8d3f831ba8b769e8ca373b +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_21-model_01-model_states.pt b/8b7178b13b/global_step84877/layer_21-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e2c5a84cd4430db34f960a65bd6c36bdedbf8e10 --- /dev/null +++ b/8b7178b13b/global_step84877/layer_21-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa384128cf36a67612d95af5049cacd5593f9fb655f7b79cfb0732d373824ebe +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_21-model_02-model_states.pt b/8b7178b13b/global_step84877/layer_21-model_02-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..faef57e2b8cdeaa14cf054030820f1237f4f5ff7 --- /dev/null +++ b/8b7178b13b/global_step84877/layer_21-model_02-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a75f03743b1dbe32dba2e0b96a5b74be645f1133c52677472913fc76cedaa656 +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_21-model_03-model_states.pt b/8b7178b13b/global_step84877/layer_21-model_03-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..02c444f10bb85d03136fbc4111aa6887fe798c5c --- /dev/null +++ b/8b7178b13b/global_step84877/layer_21-model_03-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:054c445eea4c37fbe88b4ff52e9989fbc74de6a1b86bfbea1c903b5663db0895 +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_22-model_00-model_states.pt b/8b7178b13b/global_step84877/layer_22-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8cf31089bfb4d304bde79500aa340628285d87dd --- /dev/null +++ b/8b7178b13b/global_step84877/layer_22-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:95bf70e887b4d9f99aa4fe2a7d437437aaf039153eeeaf28896c087f45d1a2cb +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_22-model_01-model_states.pt b/8b7178b13b/global_step84877/layer_22-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bbf010a4d3a07003c6692cac1d8fcc470fa7c764 --- /dev/null +++ b/8b7178b13b/global_step84877/layer_22-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd83c1d891800b3b8a54752df1fdb317ae1dd7bb91183a1b1ccbe4cbf340e75d +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_22-model_02-model_states.pt b/8b7178b13b/global_step84877/layer_22-model_02-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e34fbacb86041cd25f584cf02c441d8ab430f104 --- /dev/null +++ b/8b7178b13b/global_step84877/layer_22-model_02-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35ef84055c6888e9b4ec3700914cb79717129b6a88e5c0c2c2584a6919a2e975 +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_22-model_03-model_states.pt b/8b7178b13b/global_step84877/layer_22-model_03-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2550153351e0ac7e55ed2a1665f2eace79da9872 --- /dev/null +++ b/8b7178b13b/global_step84877/layer_22-model_03-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:595ab30874aa6f0a6623a9c881121985abd72b02c9640597246a65e0449b4e9b +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_23-model_00-model_states.pt b/8b7178b13b/global_step84877/layer_23-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c181fcea5fdb46bbb9568e89b001b2582080499c --- /dev/null +++ b/8b7178b13b/global_step84877/layer_23-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:543e3d69bbc97d242621f473e1ac0ad6c73adedbe7cf95f68f7e03c8fa790ff3 +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_23-model_01-model_states.pt b/8b7178b13b/global_step84877/layer_23-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e2d11f2dcdb8a138cfd89a2e7598b09579aed99c --- /dev/null +++ b/8b7178b13b/global_step84877/layer_23-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c9b31ee80a49b09bc4e4d88e5eff0e683b383fcbe9175d15bebb9203c61a508b +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_23-model_02-model_states.pt b/8b7178b13b/global_step84877/layer_23-model_02-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..957d53d9c5723da5c4560f2140bb93cdaf6c3747 --- /dev/null +++ b/8b7178b13b/global_step84877/layer_23-model_02-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1151ff159f5629b9ad3e8b4b735c7d8f8bd4f0470590360d9eb94efcf6d6023b +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_23-model_03-model_states.pt b/8b7178b13b/global_step84877/layer_23-model_03-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..da12c1ed992be54dc9ef3285f24a9d91932b244d --- /dev/null +++ b/8b7178b13b/global_step84877/layer_23-model_03-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35076355a59ab3cc1b67c74e3b0d112d19521942bb73bdbe3abc14bb34f718d3 +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_24-model_00-model_states.pt b/8b7178b13b/global_step84877/layer_24-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1a658cfdfa4d9e46a3e0c4df26e34060a0099953 --- /dev/null +++ b/8b7178b13b/global_step84877/layer_24-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ac1504135712596ceda890ced990cd9c122adb77215900a3788522532ccf797 +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_24-model_01-model_states.pt b/8b7178b13b/global_step84877/layer_24-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e587fe8e0777982efd9d6118d67cf63d676cbaa0 --- /dev/null +++ b/8b7178b13b/global_step84877/layer_24-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:865e811648ae2e9100d73f28ac32d07cb1ae177f9244f39eb1fe8b947eb29e0e +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_24-model_02-model_states.pt b/8b7178b13b/global_step84877/layer_24-model_02-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f16a7a377d49fc539dd530ab24ce822b5a2a7335 --- /dev/null +++ b/8b7178b13b/global_step84877/layer_24-model_02-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:33090af04b45ec3ba74b5ea227449a1d9e3338893af32b4d2003d2be8d153e39 +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_24-model_03-model_states.pt b/8b7178b13b/global_step84877/layer_24-model_03-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a919aff77aed78f381206f5f81a491a796644ab9 --- /dev/null +++ b/8b7178b13b/global_step84877/layer_24-model_03-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b1fe08ee816670357a726a200be1216c9214fec4e4bed5e74733d22c65e7f56 +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_25-model_00-model_states.pt b/8b7178b13b/global_step84877/layer_25-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0585a77499da2eb4b061e91842f72d3d34afb032 --- /dev/null +++ b/8b7178b13b/global_step84877/layer_25-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08033dca2624c789c7a8c8ed584633666de64835d639dcea5ab74f4ed5494877 +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_25-model_01-model_states.pt b/8b7178b13b/global_step84877/layer_25-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1eb1f40299e2c61206b1fed8cb91a9ebff5f599d --- /dev/null +++ b/8b7178b13b/global_step84877/layer_25-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b764bf042cf6fc4ac9d2d1838764cd000f3844f9df9e05eae12ac30bcf278b81 +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_25-model_02-model_states.pt b/8b7178b13b/global_step84877/layer_25-model_02-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..830eaab7050128e282f5041ebe10f36fd98b9436 --- /dev/null +++ b/8b7178b13b/global_step84877/layer_25-model_02-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:45abc20b17d0c0610e492848af3ace24bb75ef1c6c9740ebe9c52d80745c3fc8 +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_25-model_03-model_states.pt b/8b7178b13b/global_step84877/layer_25-model_03-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..77ffae1a742fa304f99849bec03cb8eeadb1c331 --- /dev/null +++ b/8b7178b13b/global_step84877/layer_25-model_03-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:183505316e0574b98203a71f71fe77184d4f3d978c3696e63b896d7e3ac22c04 +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_26-model_00-model_states.pt b/8b7178b13b/global_step84877/layer_26-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b7cc91e5f9f791c265f3bec58933c957b9fcf476 --- /dev/null +++ b/8b7178b13b/global_step84877/layer_26-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84910929e1b3b87518ad1c9410864c85f0b3f4202e3e89e653294775d579977d +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_26-model_01-model_states.pt b/8b7178b13b/global_step84877/layer_26-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..de31aed667e37a0fde21ab17715b2429a98059e2 --- /dev/null +++ b/8b7178b13b/global_step84877/layer_26-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a2edd3cddb70847f7f67a1ea7a4040ec23d7fd0c33d9dacfeb9ef9f824fe562d +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_26-model_02-model_states.pt b/8b7178b13b/global_step84877/layer_26-model_02-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ac6d04993b9776d70885919a2fd430328cdd138c --- /dev/null +++ b/8b7178b13b/global_step84877/layer_26-model_02-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3cde93dc9ae74862dd3256bfe5917e22499d99b34dab84d0c61be95a75f2e555 +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_26-model_03-model_states.pt b/8b7178b13b/global_step84877/layer_26-model_03-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..53419a2b16cc7322673bc404410f5cc7ddaceeaa --- /dev/null +++ b/8b7178b13b/global_step84877/layer_26-model_03-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c82b79b8f71fd1a38a27c7a67a75c890d4af1a09d2e8a4005d5540a263fac06 +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_27-model_00-model_states.pt b/8b7178b13b/global_step84877/layer_27-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c521bded77b9123a407aa2dc306102d2923c2ec6 --- /dev/null +++ b/8b7178b13b/global_step84877/layer_27-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d6d7d928a9fe6c23d03693c8d00ead4ec03992a80b3aee3dc19a3c612c59590d +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_27-model_01-model_states.pt b/8b7178b13b/global_step84877/layer_27-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fc602a45d344862a1c5fac2a4a1033a72943e770 --- /dev/null +++ b/8b7178b13b/global_step84877/layer_27-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3234be945778efdd2b546f6c3fa8f3a36ed1f7cb500cdce3c73d80e700b7477b +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_27-model_02-model_states.pt b/8b7178b13b/global_step84877/layer_27-model_02-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9ebee835063a23682b26808dfe679b0f39613970 --- /dev/null +++ b/8b7178b13b/global_step84877/layer_27-model_02-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a578245f24cc9245c3b6b68e586449b3367e447b14b5033e82f4a793a4789e49 +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_27-model_03-model_states.pt b/8b7178b13b/global_step84877/layer_27-model_03-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..355271311a12a6c3c99e77696a65a795fcb66b55 --- /dev/null +++ b/8b7178b13b/global_step84877/layer_27-model_03-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:32f28eab5541e7161ced7039ac93586259a125cd3a33838dbae5b139c1db26d7 +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_28-model_00-model_states.pt b/8b7178b13b/global_step84877/layer_28-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5c9441e201a7016b009eccef1d2c037fc381c42e --- /dev/null +++ b/8b7178b13b/global_step84877/layer_28-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1fe98a6b7672585e0243ffbd4e5018b22754674e00ac5522bd4d5a93c2d045bc +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_28-model_01-model_states.pt b/8b7178b13b/global_step84877/layer_28-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..44813b1c1f4eda9ed7b096cf8777c75e1f75101f --- /dev/null +++ b/8b7178b13b/global_step84877/layer_28-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:30f22a7c9e8bb09a59bf7a3d36a761ab7c2daf7b2c6f5e307cd0b804e62c3828 +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_28-model_02-model_states.pt b/8b7178b13b/global_step84877/layer_28-model_02-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..db664dbec864520ee0e80e6ad9683b446040733e --- /dev/null +++ b/8b7178b13b/global_step84877/layer_28-model_02-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:042d00e26f32c5291dd89ccca445fec678e7fb4ababe7a751a96d45aa0c3ce90 +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_28-model_03-model_states.pt b/8b7178b13b/global_step84877/layer_28-model_03-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8c537e7df7929c56e824668870c4e2e9574c299f --- /dev/null +++ b/8b7178b13b/global_step84877/layer_28-model_03-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f2d1691e920377f23455ad7a270274ae3d7170791cfbcb8ab6081013600519f +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_29-model_00-model_states.pt b/8b7178b13b/global_step84877/layer_29-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..99c0784db39805a465de98bf48961c3960f6d944 --- /dev/null +++ b/8b7178b13b/global_step84877/layer_29-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46da7f1de0dc332e7689c9095964397319e00d05b48aa6bc20cda7829c19397f +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_29-model_01-model_states.pt b/8b7178b13b/global_step84877/layer_29-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d1a5f8be6d5943effd280af139aaef7f588b643c --- /dev/null +++ b/8b7178b13b/global_step84877/layer_29-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:12390593eacb3896bf859322569e1f97e3046b1c9e9860a770ae8b31f5ad6afb +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_29-model_02-model_states.pt b/8b7178b13b/global_step84877/layer_29-model_02-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f089f9e29c5ab08edae648d4e219ca7a0bf0efa9 --- /dev/null +++ b/8b7178b13b/global_step84877/layer_29-model_02-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc07070274fbefe00e6cf2b9577bb29c0e45dc990e3401e864e497c10f6fef99 +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_29-model_03-model_states.pt b/8b7178b13b/global_step84877/layer_29-model_03-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2805715546e38fab8330b2d0879d7c5f13a2e220 --- /dev/null +++ b/8b7178b13b/global_step84877/layer_29-model_03-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d851f8649e161688f1128ed41c8fd3a5094e7c37276cc7be668fe5b56339101 +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_30-model_00-model_states.pt b/8b7178b13b/global_step84877/layer_30-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..78393189c0e9cd5f2d34886a2d918b3a33211fea --- /dev/null +++ b/8b7178b13b/global_step84877/layer_30-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6dd21f1ae87f5de1061ff4845b387e02b507f3895599270df0c4540ffabb4b94 +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_30-model_01-model_states.pt b/8b7178b13b/global_step84877/layer_30-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..912111db487977951b798b8398d960e5c9fe96ce --- /dev/null +++ b/8b7178b13b/global_step84877/layer_30-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:33d93de04b62bd55c9a509ddbb61c9ca14d421e66d67a4f041ce16359f3f6b2c +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_30-model_02-model_states.pt b/8b7178b13b/global_step84877/layer_30-model_02-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2b035511c95228eb8d8ba3929491b4b5b7f9bfff --- /dev/null +++ b/8b7178b13b/global_step84877/layer_30-model_02-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51111d73870159c4c81bf80909614248a8b6662661619d214eccc355dbc7b8ea +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_30-model_03-model_states.pt b/8b7178b13b/global_step84877/layer_30-model_03-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e3bb0ddc58c0cbc4c1a6a55395dbba5778743d27 --- /dev/null +++ b/8b7178b13b/global_step84877/layer_30-model_03-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4bee89c177e208ca5b897c4e76b19dfd8ec6097ec0bbb93bfc49cc11355e3cd8 +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_31-model_00-model_states.pt b/8b7178b13b/global_step84877/layer_31-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4483013a89a52b61711ec827ab0cc236a7b3f01e --- /dev/null +++ b/8b7178b13b/global_step84877/layer_31-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3aacc37a224d82599e0ea97d86a08adcf973b2f298194681cdf675caac2c6e3 +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_31-model_01-model_states.pt b/8b7178b13b/global_step84877/layer_31-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..77bcb8785480ea652ea14e04614014c17fd9b1e8 --- /dev/null +++ b/8b7178b13b/global_step84877/layer_31-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6deef8541e31716d6065329f554950e195741e723baa7a2a3d03cf98961194b +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_31-model_02-model_states.pt b/8b7178b13b/global_step84877/layer_31-model_02-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8194649657e3a6de5fd18038639103db83bf556a --- /dev/null +++ b/8b7178b13b/global_step84877/layer_31-model_02-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7bdf44f210984444a45228c775caf1de99f910ccd593a13bfc107c28e8c13b3 +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_31-model_03-model_states.pt b/8b7178b13b/global_step84877/layer_31-model_03-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ac860991e5d49dbdaf417e4eece0c69e84575e87 --- /dev/null +++ b/8b7178b13b/global_step84877/layer_31-model_03-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ee393ec1aa66dd21fe050981ff60e6e9e7aab9642b3d539faaaf035763649b3 +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_32-model_00-model_states.pt b/8b7178b13b/global_step84877/layer_32-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..26b46b467d37ec4732ee72eb83d43d2b634a9e4d --- /dev/null +++ b/8b7178b13b/global_step84877/layer_32-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:48cece145b23eef7c17aec823ee35a290fe2bc1fb828ffe46bce9f755fb3b0a3 +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_32-model_01-model_states.pt b/8b7178b13b/global_step84877/layer_32-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b4f21ebb18f05a0977a0347ccec353fa522b8c34 --- /dev/null +++ b/8b7178b13b/global_step84877/layer_32-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:62096d90c82e17fdf3375cefd88c33eb49901c8ef122a555b457321c84b05446 +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_32-model_02-model_states.pt b/8b7178b13b/global_step84877/layer_32-model_02-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..39f76844c79991fb765898c02b6831140614ba3a --- /dev/null +++ b/8b7178b13b/global_step84877/layer_32-model_02-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d8177c89fce0d2ddacecab08dfddc8b949492cd3b29917eeb3ee3c72b489b2b +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_32-model_03-model_states.pt b/8b7178b13b/global_step84877/layer_32-model_03-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ef1a80dc8719c8ad69664cbeec58d68a1d6e4c57 --- /dev/null +++ b/8b7178b13b/global_step84877/layer_32-model_03-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e9c78373f7862134f223e39420b1009285575288be8010abcf75dc11a9039fe +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_33-model_00-model_states.pt b/8b7178b13b/global_step84877/layer_33-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cc9f2489cac6e3f707a8872d19377ee863189503 --- /dev/null +++ b/8b7178b13b/global_step84877/layer_33-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bfcfe821a54335e6e0983b7c87033d1bc5c6d97a216193510c9895023a80a1ca +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_33-model_01-model_states.pt b/8b7178b13b/global_step84877/layer_33-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8a4318a8694a7a0b7c93cfa7232d48940e56ea09 --- /dev/null +++ b/8b7178b13b/global_step84877/layer_33-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1729a0545dc0a2c5fb1f0e2f2c437e6501c84e0ce5a0539a50f5f8bc701da0e0 +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_33-model_02-model_states.pt b/8b7178b13b/global_step84877/layer_33-model_02-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8a4c1062d92fbfb72c05064a436067f37628422e --- /dev/null +++ b/8b7178b13b/global_step84877/layer_33-model_02-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ccb22b939938c8dde4230c0fd3998b19a701a06207cbd923dc7456dffc482796 +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_33-model_03-model_states.pt b/8b7178b13b/global_step84877/layer_33-model_03-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d03b18973a7ca3c45f9c5ba7d07eafee7f3f3197 --- /dev/null +++ b/8b7178b13b/global_step84877/layer_33-model_03-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a7339bc3d1a812933467e38ec6cdbd1d0ad4812a77ceb6a98d0bf07f87ef15b7 +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_34-model_00-model_states.pt b/8b7178b13b/global_step84877/layer_34-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4c1339240a6f99e5464c0ba3b6a3591e584afa81 --- /dev/null +++ b/8b7178b13b/global_step84877/layer_34-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:60da5fc50a6707463533203e2b1190548863b52d575e44ff7082e98edb908dc1 +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_34-model_01-model_states.pt b/8b7178b13b/global_step84877/layer_34-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..12439539b1d4145af65933c9964bd5d72c1abeee --- /dev/null +++ b/8b7178b13b/global_step84877/layer_34-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b3ef11db3c57e455f11e9a416053f6124755adeceff930a5dce751fddac5313 +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_34-model_02-model_states.pt b/8b7178b13b/global_step84877/layer_34-model_02-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5bf513d4911c50a4e54952d4820cfbfcbcfd5e5a --- /dev/null +++ b/8b7178b13b/global_step84877/layer_34-model_02-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:62589b1e3072fc7b17928b1db49904ae292beb68fa79fd1763238286bf17f527 +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_34-model_03-model_states.pt b/8b7178b13b/global_step84877/layer_34-model_03-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e0b234d932039d8b20fbba603cb097baebc9af64 --- /dev/null +++ b/8b7178b13b/global_step84877/layer_34-model_03-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f5ff6cb758c08935e424409e4bbf6c6af1aafd836fe4159ca3da21795929a144 +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_35-model_00-model_states.pt b/8b7178b13b/global_step84877/layer_35-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a1d748f3be716460c05708c3cea166d99c754fe2 --- /dev/null +++ b/8b7178b13b/global_step84877/layer_35-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:04a7f0cd1b5eaaaa6b23391b37fc544d8e09efab53f6f8bc6d438b3c7791fcbd +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_35-model_01-model_states.pt b/8b7178b13b/global_step84877/layer_35-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d4272fd9a8f5560da4d5304dfd9c8c6ed1847172 --- /dev/null +++ b/8b7178b13b/global_step84877/layer_35-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf3d4f599e92afdd6257b0c81c5fa118f5a75852759376702df5cc25fa6a1c38 +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_35-model_02-model_states.pt b/8b7178b13b/global_step84877/layer_35-model_02-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..20bf220688c8fb36fe5bea2e45ed3ec14cab1113 --- /dev/null +++ b/8b7178b13b/global_step84877/layer_35-model_02-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d41b48253c3f8098afe4cb84312a69fdcf5db0efefb663416245c3beedd5c53 +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_35-model_03-model_states.pt b/8b7178b13b/global_step84877/layer_35-model_03-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4513608abc8f9e2321fe722c7938f1f590ce58f0 --- /dev/null +++ b/8b7178b13b/global_step84877/layer_35-model_03-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:acb99c609d7e7be6db6ca07b68525ff8a7ab788e2c80225d156d686daa89a52a +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_36-model_00-model_states.pt b/8b7178b13b/global_step84877/layer_36-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e447d1e3f2e66a42901bc671afa92d939cfe590b --- /dev/null +++ b/8b7178b13b/global_step84877/layer_36-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e87b58fe0a89300341f2db67fe019a7a75386d52b041e1e421e6235979842ae2 +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_36-model_01-model_states.pt b/8b7178b13b/global_step84877/layer_36-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..028b1c25608d603e0e0a4b32b49a4801dc9a525c --- /dev/null +++ b/8b7178b13b/global_step84877/layer_36-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:65acd8694623b05c06d1ad9cf6f1e17032e387ddee00091a9fe129dd456d6f55 +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_36-model_02-model_states.pt b/8b7178b13b/global_step84877/layer_36-model_02-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..beab99aabcd5be57c02b1afc96cc74056a9227bc --- /dev/null +++ b/8b7178b13b/global_step84877/layer_36-model_02-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d52eda66222350a1a73a6d5299fb8b6be4b63bf6482fc730d3b9b33a01b4e70 +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_36-model_03-model_states.pt b/8b7178b13b/global_step84877/layer_36-model_03-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8afb28a00b2d6a162906291ee8ea83c07677b032 --- /dev/null +++ b/8b7178b13b/global_step84877/layer_36-model_03-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:94410afdcfba0e31358e8b946e193fdc84749aece817f6906fdc359f70a22a0d +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_37-model_00-model_states.pt b/8b7178b13b/global_step84877/layer_37-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e26539e6b1c18bbae0ddeb176d4e8befac3bc1f5 --- /dev/null +++ b/8b7178b13b/global_step84877/layer_37-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0bedd3d02324a75ecf527adf89175750ca85ac9ec5390fdaa442865ba5eea7fa +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_37-model_01-model_states.pt b/8b7178b13b/global_step84877/layer_37-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d504f0d8fa36be8a24f93cfad003c8796685526a --- /dev/null +++ b/8b7178b13b/global_step84877/layer_37-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:13c9fb0c9c78f629c4b751eb0d0215a416a2d9ec62871b83b7016e5b212540e1 +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_37-model_02-model_states.pt b/8b7178b13b/global_step84877/layer_37-model_02-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cbe56b3f12c398d51145776cb9f2ac0916774d56 --- /dev/null +++ b/8b7178b13b/global_step84877/layer_37-model_02-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a61d0f55b632d3e9ba315cc118010bb5e96b2104e6ac022cfb6e5be395040046 +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_37-model_03-model_states.pt b/8b7178b13b/global_step84877/layer_37-model_03-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8640cdadc5fa5db1d8b94e59d099d3822b5f74a6 --- /dev/null +++ b/8b7178b13b/global_step84877/layer_37-model_03-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:21023c16db8dcebccb1ee8216a5cd433a2b8181a2c7e3e151e5156147f5118f7 +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_38-model_00-model_states.pt b/8b7178b13b/global_step84877/layer_38-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ae7b71ca35eea6ece71fc87d0c88b8f127ce0bbe --- /dev/null +++ b/8b7178b13b/global_step84877/layer_38-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad857f92745f6e0b9c5f8d0a4ecf8e1f2f16010ea6858280acce208c913cbd7e +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_38-model_01-model_states.pt b/8b7178b13b/global_step84877/layer_38-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f64f00d1cc991be926a21e952401a2a85fb533f1 --- /dev/null +++ b/8b7178b13b/global_step84877/layer_38-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:295f7b3dcabcccf72ed2b534eb0256c99f23165815d6d2ae5da8ac751742651f +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_38-model_02-model_states.pt b/8b7178b13b/global_step84877/layer_38-model_02-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c015d9362be2b21ddf58204d420adbd2726be811 --- /dev/null +++ b/8b7178b13b/global_step84877/layer_38-model_02-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c70d9aca6bdfc52073ec3de0569688741ff4a41aa6776296f6eec3f7230733c +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_38-model_03-model_states.pt b/8b7178b13b/global_step84877/layer_38-model_03-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bb945858c73041343da2d79341b5653bb169bea8 --- /dev/null +++ b/8b7178b13b/global_step84877/layer_38-model_03-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e51746d4f4d53d3daa787da4f9e068fb377ca97838b5d19dc4c99e2465a1fe5 +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_39-model_00-model_states.pt b/8b7178b13b/global_step84877/layer_39-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fe9dbd264120c3010e2e03febdab52621394bd2f --- /dev/null +++ b/8b7178b13b/global_step84877/layer_39-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:14f7ef2b81d4bafdbab61d57b80b6b4a5cb81057d4977781c84a93cf5a13249a +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_39-model_01-model_states.pt b/8b7178b13b/global_step84877/layer_39-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9fd94dc8337a7511b4d5b481ee12d3e87f578732 --- /dev/null +++ b/8b7178b13b/global_step84877/layer_39-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:25b36c6bc562322033b593766defca6abfa26ff15967804c33da0fc66627d25f +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_39-model_02-model_states.pt b/8b7178b13b/global_step84877/layer_39-model_02-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2226331600c703e1e5661c20fec5c14a5baecc1e --- /dev/null +++ b/8b7178b13b/global_step84877/layer_39-model_02-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fac2c9bb024d71df4089efba7ad6b91cc4bb9d293edcf82f8d6bea32d73c4344 +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_39-model_03-model_states.pt b/8b7178b13b/global_step84877/layer_39-model_03-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..94ea8c83c5148e31c636a23c480250eb043f9d04 --- /dev/null +++ b/8b7178b13b/global_step84877/layer_39-model_03-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:54569f7605be36e87628253fdbfc49793cc29f35a83081c6f277e39e422c1c4e +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_40-model_00-model_states.pt b/8b7178b13b/global_step84877/layer_40-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..51dc9ed7cfd17571c74d4ecc2d22fc2a62eb7fbc --- /dev/null +++ b/8b7178b13b/global_step84877/layer_40-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:872e9e9196d46107007935cbe235244caa11450a7dc794e1730a98975ba05ac8 +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_40-model_01-model_states.pt b/8b7178b13b/global_step84877/layer_40-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1a1d3de9707a80d53f17581e68f4f1df2b3ee4df --- /dev/null +++ b/8b7178b13b/global_step84877/layer_40-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b2e5a1527a4d6e253f22d6bdefb19063beb8e4e943ee3a01c5517841d0f856a +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_40-model_02-model_states.pt b/8b7178b13b/global_step84877/layer_40-model_02-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c68b7f64a4eb94250556c28e58d3d91d7c43dd31 --- /dev/null +++ b/8b7178b13b/global_step84877/layer_40-model_02-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c05c3f97914cdec656987f30aaf7a0b7bcf3901a608af7c213cb4c59a72fb99 +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_40-model_03-model_states.pt b/8b7178b13b/global_step84877/layer_40-model_03-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..51eb506a91fec743bda009f03dbcc695e5372b86 --- /dev/null +++ b/8b7178b13b/global_step84877/layer_40-model_03-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e9e0e8e593cd37f5d99586353604c09d70f4f8e077ba8f91b4c55af696ce996b +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_41-model_00-model_states.pt b/8b7178b13b/global_step84877/layer_41-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8ce16e9352027194240219b2017c2b15f8ef1fb1 --- /dev/null +++ b/8b7178b13b/global_step84877/layer_41-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9fbb3474c272bd9c1fe282bf90cbaedcddd9cd8b583ddac26f57ddc4d97301be +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_41-model_01-model_states.pt b/8b7178b13b/global_step84877/layer_41-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fb9871b3d21a2f1b83c6809825a5773ade2dc0bb --- /dev/null +++ b/8b7178b13b/global_step84877/layer_41-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:acd32c384a606364e0144077b8d0013905172d1d22d5baf4f175e1c4afaa531c +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_41-model_02-model_states.pt b/8b7178b13b/global_step84877/layer_41-model_02-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c591674bc7cdd178c5e01202537e947cba9c624e --- /dev/null +++ b/8b7178b13b/global_step84877/layer_41-model_02-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d6eff913e774aed521d0085bca9db46ef8992fcd8a70e40b34c5a3b56247c74 +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_41-model_03-model_states.pt b/8b7178b13b/global_step84877/layer_41-model_03-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4864e5b3a5ef6738790b44b44d0a0dc217680090 --- /dev/null +++ b/8b7178b13b/global_step84877/layer_41-model_03-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:72410fc9203eb36a2dfae564d4504a9f966f51bb91e058c198857cf1a108b3b8 +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_42-model_00-model_states.pt b/8b7178b13b/global_step84877/layer_42-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3890098db0ed50fb36bf9fd2a84762d59c4f3e81 --- /dev/null +++ b/8b7178b13b/global_step84877/layer_42-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:16c66fecb6c555d063a70af1db5ca9297bd36c831e9717eb8622d4c083b1ee45 +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_42-model_01-model_states.pt b/8b7178b13b/global_step84877/layer_42-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f79b9fbb34d173bf80a4a7dc52be75ce3c03cf8b --- /dev/null +++ b/8b7178b13b/global_step84877/layer_42-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f8372ab38e32ec4ad747b50149bff8fe3d5ca6d8a6a415549bc79e7e200cf9a +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_42-model_02-model_states.pt b/8b7178b13b/global_step84877/layer_42-model_02-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a030d06684bee0180f9a26555f66dd5729cc2e80 --- /dev/null +++ b/8b7178b13b/global_step84877/layer_42-model_02-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0004293cdea47fd828e96c8a11e705c6dc006764b20bd72f941e6727c12feaad +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_42-model_03-model_states.pt b/8b7178b13b/global_step84877/layer_42-model_03-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..df0c78e655c6e894ba5ceab6fec55325c4f18978 --- /dev/null +++ b/8b7178b13b/global_step84877/layer_42-model_03-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:28c82393b2d708908f9254277eb5b4f6654555afc2fbe490c2bf132d8e89952a +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_43-model_00-model_states.pt b/8b7178b13b/global_step84877/layer_43-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..51d8e8355ca0e7ad372ad652658ec192f53cc121 --- /dev/null +++ b/8b7178b13b/global_step84877/layer_43-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:63403a4a0d78d016beab9af53a3b5dd1da2a4a15484783392d25d77437676a8f +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_43-model_01-model_states.pt b/8b7178b13b/global_step84877/layer_43-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..65434d09d50b1186c7208336f7ef2cf49372ea99 --- /dev/null +++ b/8b7178b13b/global_step84877/layer_43-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9dc685671a1049f789e823a5b82ffe1d8da4129d2667dce6e368d8f3bc0f8fc9 +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_43-model_02-model_states.pt b/8b7178b13b/global_step84877/layer_43-model_02-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6ea0a18e362edddeaad6eff05020c5ed4ba0cbec --- /dev/null +++ b/8b7178b13b/global_step84877/layer_43-model_02-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b1860de6b29e4a756bd1fcd71ddf09ceda10b98cf20c712ce424afdf253288f1 +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_43-model_03-model_states.pt b/8b7178b13b/global_step84877/layer_43-model_03-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..67f42d83de78c7f24d5d7eff1b40d74482985922 --- /dev/null +++ b/8b7178b13b/global_step84877/layer_43-model_03-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:12e96cc21bb76d9296b7319ac6ad6e328fb1ebc13a09d9a97abd5f8903b6eef3 +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_44-model_00-model_states.pt b/8b7178b13b/global_step84877/layer_44-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2466313096006927ea662949b90fe332ef238bdc --- /dev/null +++ b/8b7178b13b/global_step84877/layer_44-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f367466eadb6b9f153134b6f5ed2a70ace0df31c0f6a0b072dd5d02ec00fad7a +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_44-model_01-model_states.pt b/8b7178b13b/global_step84877/layer_44-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..95ec7dba50a923cf644e221234fcf9b319ae665c --- /dev/null +++ b/8b7178b13b/global_step84877/layer_44-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d8d709836376ec5668bdc2e14e300f22c12911a18675d5ed73480d0445064b6 +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_44-model_02-model_states.pt b/8b7178b13b/global_step84877/layer_44-model_02-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..33e506b006b87d016650e7721a175f74495c5238 --- /dev/null +++ b/8b7178b13b/global_step84877/layer_44-model_02-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7666dd85fbc84f9ff210e169b769cfd604b6092b33276021f8290ffe544aa1f +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_44-model_03-model_states.pt b/8b7178b13b/global_step84877/layer_44-model_03-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..41511f0bc64fdd277a87b276dff34c4c11c7728c --- /dev/null +++ b/8b7178b13b/global_step84877/layer_44-model_03-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:546ed0dd9a89a5b28512c8867a97e3d44ce327a08bec2089c342dbb32ec56568 +size 100731139 diff --git a/8b7178b13b/global_step84877/layer_46-model_00-model_states.pt b/8b7178b13b/global_step84877/layer_46-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..78edefefbaf976396a4d0b772dc496f79323b543 --- /dev/null +++ b/8b7178b13b/global_step84877/layer_46-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2503d030a5b8c53c80a70fb259bfab93f16e1a6d0d33df18dc6ab453c1bfd7db +size 17603 diff --git a/8b7178b13b/global_step84877/layer_46-model_01-model_states.pt b/8b7178b13b/global_step84877/layer_46-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..181d0dc5c535854f8f80c71e1eaca3819818a2eb --- /dev/null +++ b/8b7178b13b/global_step84877/layer_46-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f55d34f2f731e4853d878291d3b8c08ac44ee7a3da2abe36c97c04fdf6c86b7f +size 17603 diff --git a/8b7178b13b/global_step84877/layer_46-model_02-model_states.pt b/8b7178b13b/global_step84877/layer_46-model_02-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3fdb4bcc1879b0885260ee2c7df0dc113498bd50 --- /dev/null +++ b/8b7178b13b/global_step84877/layer_46-model_02-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e42c442e1d7c80adfcb25c34bdd23c962555cf21cdc2e7ac94616e3e9fc73f36 +size 17603 diff --git a/8b7178b13b/global_step84877/layer_46-model_03-model_states.pt b/8b7178b13b/global_step84877/layer_46-model_03-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d4f689e68be36045344ea4df063a26ce95017523 --- /dev/null +++ b/8b7178b13b/global_step84877/layer_46-model_03-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:082261d7deffca365b9be6f9b756e619a07dcdbc2792eb16e824714945a2c30e +size 17603 diff --git a/8b7178b13b/global_step84877/mp_rank_00_model_states.pt b/8b7178b13b/global_step84877/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b4521a63f1691d1dd385869fab0e1100a660a1a7 --- /dev/null +++ b/8b7178b13b/global_step84877/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:11fdb89be739d9495dedf199be1c9cb76636b6ff760ab20ef704ff65a8179ce8 +size 32563 diff --git a/8b7178b13b/global_step84877/mp_rank_01_model_states.pt b/8b7178b13b/global_step84877/mp_rank_01_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c6d5323468c140ddf61a3fb417ee5ce327ca187c --- /dev/null +++ b/8b7178b13b/global_step84877/mp_rank_01_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8252da27afed751a5ae3b4090c7527c0f60c718b74391cbd30a71c3970002283 +size 32563 diff --git a/8b7178b13b/global_step84877/mp_rank_02_model_states.pt b/8b7178b13b/global_step84877/mp_rank_02_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cf1ac0c3abe7917c7ea07cd2a2be44be4aa6193d --- /dev/null +++ b/8b7178b13b/global_step84877/mp_rank_02_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:104cb6094eb8ba38cbe9d3776e6e509b971fb1edfba92f1983d289c56e034d49 +size 32563 diff --git a/8b7178b13b/global_step84877/mp_rank_03_model_states.pt b/8b7178b13b/global_step84877/mp_rank_03_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..18a34ee2c03874bde4a277b84f9108e5d0c4af39 --- /dev/null +++ b/8b7178b13b/global_step84877/mp_rank_03_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:708a068d70a17e43f48b261785ea8a9778339bb56926b8e7c238baea01110975 +size 32563 diff --git a/8b7178b13b/global_step84877/mp_rank_04_model_states.pt b/8b7178b13b/global_step84877/mp_rank_04_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0edb25b2699103e4f92451cb9bad8d12185a6032 --- /dev/null +++ b/8b7178b13b/global_step84877/mp_rank_04_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:958fad8d995c111b5644992ad9b5dddeea5e9e469a47f03a67affc46fb0e9abc +size 32435 diff --git a/8b7178b13b/global_step84877/mp_rank_05_model_states.pt b/8b7178b13b/global_step84877/mp_rank_05_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3d1b5b11584638e4a99a8cba2a116295fbdae83f --- /dev/null +++ b/8b7178b13b/global_step84877/mp_rank_05_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3db7001bc98106f1cd13c56f2852879ed580353c72a4d904de643c95b1aac59 +size 32435 diff --git a/8b7178b13b/global_step84877/mp_rank_06_model_states.pt b/8b7178b13b/global_step84877/mp_rank_06_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..111718694383c1da016e905ee09e7251b642356d --- /dev/null +++ b/8b7178b13b/global_step84877/mp_rank_06_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6a15103394c348b4412241a1fa34b760089b28611178aa2a2f33ae04261ee180 +size 32435 diff --git a/8b7178b13b/global_step84877/mp_rank_07_model_states.pt b/8b7178b13b/global_step84877/mp_rank_07_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c3a3f25331f8eaf2a8d0ab68730d43b6749e796e --- /dev/null +++ b/8b7178b13b/global_step84877/mp_rank_07_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aec064deb4c439b0fca83455966b8e850ea39a7ec8f1d986a0bf95b779e6e849 +size 32435 diff --git a/8b7178b13b/global_step84877/mp_rank_08_model_states.pt b/8b7178b13b/global_step84877/mp_rank_08_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f9c919b49f3e7158e14bae6a6f2a4f9249cc071f --- /dev/null +++ b/8b7178b13b/global_step84877/mp_rank_08_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5204c4399eecda77505c29eb8e44c3663ec6d4620ee4c4de57a73a6af285888f +size 32499 diff --git a/8b7178b13b/global_step84877/mp_rank_09_model_states.pt b/8b7178b13b/global_step84877/mp_rank_09_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4fe637b0ea7cad767218769a7eb38d02e284071f --- /dev/null +++ b/8b7178b13b/global_step84877/mp_rank_09_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9fc01add2471535d69300d891972f881c2dea266282d8e1e5a3a7c48de9bc9dd +size 32499 diff --git a/8b7178b13b/global_step84877/mp_rank_10_model_states.pt b/8b7178b13b/global_step84877/mp_rank_10_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..11828f9862d33c9a861e97058af3168271f4b049 --- /dev/null +++ b/8b7178b13b/global_step84877/mp_rank_10_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc707c01d6d9b434b418177f1a428725fa7694ff811a43f69037ae1522ffa05c +size 32499 diff --git a/8b7178b13b/global_step84877/mp_rank_11_model_states.pt b/8b7178b13b/global_step84877/mp_rank_11_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..95323ed65f954c9ec105cf8e70a039d9ae4b4b95 --- /dev/null +++ b/8b7178b13b/global_step84877/mp_rank_11_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9075291eda7400c894480bf472e8a195c5e6bd5065a3cdb0706968149101aa58 +size 32499 diff --git a/8b7178b13b/global_step84877/mp_rank_12_model_states.pt b/8b7178b13b/global_step84877/mp_rank_12_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2c0db76cfa291b4dd9850a0acf43ced2b312a5bf --- /dev/null +++ b/8b7178b13b/global_step84877/mp_rank_12_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4952ae3e7e72a0455f516cd3af725d12564588beda1f55da127a8687e9fbb423 +size 31155 diff --git a/8b7178b13b/global_step84877/mp_rank_13_model_states.pt b/8b7178b13b/global_step84877/mp_rank_13_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b00c54e6132b5284b65baab13f97e5a77296d6aa --- /dev/null +++ b/8b7178b13b/global_step84877/mp_rank_13_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b116439437707b5268cc1b2ff8b23fca995e70ef479760f806817dcc554b18f +size 31155 diff --git a/8b7178b13b/global_step84877/mp_rank_14_model_states.pt b/8b7178b13b/global_step84877/mp_rank_14_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d4fad58a1579f2fd6c0d2f8c34c196ad3d03ffbd --- /dev/null +++ b/8b7178b13b/global_step84877/mp_rank_14_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b5fc65a2f1fcee3d5c322413a0d8e3157da93d27e300f7d7ccb3a5016bbe4940 +size 31155 diff --git a/8b7178b13b/global_step84877/mp_rank_15_model_states.pt b/8b7178b13b/global_step84877/mp_rank_15_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..91f79a63df85270b7a6762857c25b36b317c65a5 --- /dev/null +++ b/8b7178b13b/global_step84877/mp_rank_15_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76c8a877f496c425ae0be614b303b1ce1b938e4f23482022acfa271296e846c3 +size 31155 diff --git a/8b7178b13b/transformers/config.json b/8b7178b13b/transformers/config.json new file mode 100644 index 0000000000000000000000000000000000000000..22c9280969b993eed6debb17878f6b04abbfcca3 --- /dev/null +++ b/8b7178b13b/transformers/config.json @@ -0,0 +1 @@ +{"vocab_size": 50688, "n_positions": 2048, "n_embd": 4096, "n_layer": 42, "n_head": 32, "n_inner": 16384, "activation_function": "gelu", "resid_pdrop": 0.1, "embd_pdrop": 0.1, "attn_pdrop": 0.1, "layer_norm_epsilon": 1e-05, "initializer_range": 0.02, "summary_type": "cls_index", "summary_use_proj": true, "summary_activation": null, "summary_first_dropout": 0.1, "summary_proj_to_labels": true, "scale_attn_weights": true, "use_cache": true, "scale_attn_by_inverse_layer_idx": false, "reorder_and_upcast_attn": false, "bos_token_id": 50256, "eos_token_id": 50256, "return_dict": true, "output_hidden_states": false, "output_attentions": false, "torchscript": false, "torch_dtype": null, "use_bfloat16": false, "tf_legacy_loss": false, "pruned_heads": {}, "tie_word_embeddings": true, "is_encoder_decoder": false, "is_decoder": false, "cross_attention_hidden_size": null, "add_cross_attention": false, "tie_encoder_decoder": false, "max_length": 20, "min_length": 0, "do_sample": false, "early_stopping": false, "num_beams": 1, "num_beam_groups": 1, "diversity_penalty": 0.0, "temperature": 1.0, "top_k": 50, "top_p": 1.0, "typical_p": 1.0, "repetition_penalty": 1.0, "length_penalty": 1.0, "no_repeat_ngram_size": 0, "encoder_no_repeat_ngram_size": 0, "bad_words_ids": null, "num_return_sequences": 1, "chunk_size_feed_forward": 0, "output_scores": false, "return_dict_in_generate": false, "forced_bos_token_id": null, "forced_eos_token_id": null, "remove_invalid_values": false, "exponential_decay_length_penalty": null, "suppress_tokens": null, "begin_suppress_tokens": null, "architectures": ["GPT2LMHeadModel"], "finetuning_task": null, "id2label": {"0": "LABEL_0", "1": "LABEL_1"}, "label2id": {"LABEL_0": 0, "LABEL_1": 1}, "tokenizer_class": null, "prefix": null, "pad_token_id": null, "sep_token_id": null, "decoder_start_token_id": null, "task_specific_params": null, "problem_type": null, "_name_or_path": "", "transformers_version": "4.25.0.dev0", "n_ctx": 1024, "gradient_checkpointing": false, "model_type": "gpt2"} \ No newline at end of file diff --git a/8b7178b13b/transformers/pytorch_model.bin b/8b7178b13b/transformers/pytorch_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..b49ef91adc32e8b04f723fe1abd4189990b26202 --- /dev/null +++ b/8b7178b13b/transformers/pytorch_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a17cb0f1a55f0b1d38a7357dbaeb05e61795b6280a2812b747c9f817ee966d6 +size 17700448349