diff --git a/.gitattributes b/.gitattributes index 463557ab2ca226e0eb475b488049813ff7df114c..1cc57ef8f90d95ad13febc5f269c72797f77c622 100644 --- a/.gitattributes +++ b/.gitattributes @@ -80,3 +80,51 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text 8b7178b44b/evaluation/generation/examples.8b7178b44b_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl filter=lfs diff=lfs merge=lfs -text 8b7178b44b/evaluation/generation/examples.8b7178b44b_gem_xsum_article_DOC_summary_0.jsonl filter=lfs diff=lfs merge=lfs -text 8b7178b88b/evaluation/generation/examples.8b7178b88b_GEM-web_nlg_en_PALM_prompt_0.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b35b/evaluation/generation/examples.8b7178b35b_gem_xsum_article_DOC_summary_5.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b35b/evaluation/generation/examples.global_step84877_GEM-wiki_lingua_en_tldr_en_1.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b35b/evaluation/generation/examples.global_step84877_GEM-wiki_lingua_en_tldr_en_4.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b35b/evaluation/generation/examples.global_step84877_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b35b/evaluation/generation/examples.global_step84877_GEM-wiki_lingua_en_tldr_en_2.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b35b/evaluation/generation/examples.global_step84877_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b35b/evaluation/generation/examples.global_step84877_gem_xsum_article_DOC_summary_2.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b35b/evaluation/generation/examples.8b7178b35b_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b35b/evaluation/generation/examples.8b7178b35b_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b35b/evaluation/generation/examples.8b7178b35b_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b35b/evaluation/generation/examples.8b7178b35b_gem_xsum_article_DOC_summary_1.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b35b/evaluation/generation/examples.global_step84877_GEM-web_nlg_en_PALM_prompt_4.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b35b/evaluation/generation/examples.8b7178b35b_gem_xsum_article_DOC_summary_0.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b35b/evaluation/generation/examples.global_step84877_GEM-wiki_lingua_en_tldr_en_0.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b35b/evaluation/generation/examples.8b7178b35b_GEM-web_nlg_en_PALM_prompt_2.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b35b/evaluation/generation/examples.8b7178b35b_GEM-wiki_lingua_en_tldr_en_1.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b35b/evaluation/generation/examples.8b7178b35b_GEM-wiki_lingua_en_tldr_en_3.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b35b/evaluation/generation/examples.8b7178b35b_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b35b/evaluation/generation/examples.8b7178b35b_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b35b/evaluation/generation/examples.8b7178b35b_GEM-web_nlg_en_PALM_prompt_4.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b35b/evaluation/generation/examples.8b7178b35b_GEM-web_nlg_en_PALM_prompt_5.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b35b/evaluation/generation/examples.8b7178b35b_GEM-wiki_lingua_en_tldr_en_5.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b35b/evaluation/generation/examples.global_step84877_gem_xsum_article_DOC_summary_3.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b35b/evaluation/generation/examples.global_step84877_gem_xsum_article_DOC_summary_5.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b35b/evaluation/generation/examples.global_step84877_GEM-web_nlg_en_PALM_prompt_2.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b35b/evaluation/generation/examples.global_step84877_GEM-wiki_lingua_en_tldr_en_3.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b35b/evaluation/generation/examples.global_step84877_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b35b/evaluation/generation/examples.global_step84877_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b35b/evaluation/generation/examples.global_step84877_gem_xsum_article_DOC_summary_0.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b35b/evaluation/generation/examples.8b7178b35b_GEM-web_nlg_en_PALM_prompt_3.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b35b/evaluation/generation/examples.8b7178b35b_GEM-wiki_lingua_en_tldr_en_2.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b35b/evaluation/generation/examples.8b7178b35b_GEM-wiki_lingua_en_tldr_en_4.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b35b/evaluation/generation/examples.global_step84877_GEM-web_nlg_en_PALM_prompt_1.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b35b/evaluation/generation/examples.global_step84877_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b35b/evaluation/generation/examples.global_step84877_GEM-web_nlg_en_PALM_prompt_3.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b35b/evaluation/generation/examples.global_step84877_GEM-web_nlg_en_PALM_prompt_5.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b35b/evaluation/generation/examples.global_step84877_GEM-wiki_lingua_en_tldr_en_5.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b35b/evaluation/generation/examples.8b7178b35b_GEM-web_nlg_en_PALM_prompt_1.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b35b/evaluation/generation/examples.8b7178b35b_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b35b/evaluation/generation/examples.8b7178b35b_gem_xsum_article_DOC_summary_3.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b35b/evaluation/generation/examples.8b7178b35b_gem_xsum_article_DOC_summary_4.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b35b/evaluation/generation/examples.global_step84877_GEM-web_nlg_en_PALM_prompt_0.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b35b/evaluation/generation/examples.global_step84877_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b35b/evaluation/generation/examples.global_step84877_gem_xsum_article_DOC_summary_4.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b35b/evaluation/generation/examples.8b7178b35b_GEM-web_nlg_en_PALM_prompt_0.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b35b/evaluation/generation/examples.8b7178b35b_GEM-wiki_lingua_en_tldr_en_0.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b35b/evaluation/generation/examples.8b7178b35b_gem_xsum_article_DOC_summary_2.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b35b/evaluation/generation/examples.global_step84877_gem_xsum_article_DOC_summary_1.jsonl filter=lfs diff=lfs merge=lfs -text diff --git a/8b7178b35b/evaluation/generation/agg.8b7178b35b_GEM-web_nlg_en_PALM_prompt_0.json b/8b7178b35b/evaluation/generation/agg.8b7178b35b_GEM-web_nlg_en_PALM_prompt_0.json new file mode 100644 index 0000000000000000000000000000000000000000..0844e62727381b85d3233b7fd42c3d65c8712664 --- /dev/null +++ b/8b7178b35b/evaluation/generation/agg.8b7178b35b_GEM-web_nlg_en_PALM_prompt_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.347289354458488, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.03777797007924809}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.079226368742227, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0023231969845277887}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.28110828630725015, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004882004381200993}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.10890954353426278, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002110258935484955}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.03743726607123581, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.001494228694268955}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.13690374884005102, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.003169133187878269}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.05172430149730381, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0013180585408877222}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.07666350308702279, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0022367957170880146}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.2745019482026448, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004789753920178336}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.10554978776184795, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0020007799763877027}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.07592638133051025, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.002251359653603086}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.2686557447211624, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004613052990575398}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.10411236694388043, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0019983020211639833}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b35b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b35b/evaluation/generation/agg.8b7178b35b_GEM-web_nlg_en_PALM_prompt_1.json b/8b7178b35b/evaluation/generation/agg.8b7178b35b_GEM-web_nlg_en_PALM_prompt_1.json new file mode 100644 index 0000000000000000000000000000000000000000..71ed80e1098404d06c3b8daf945d69fe1fb0e3db --- /dev/null +++ b/8b7178b35b/evaluation/generation/agg.8b7178b35b_GEM-web_nlg_en_PALM_prompt_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.5749625372797772, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.042168587225678913}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.1384507797063748, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.004372707845611215}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.322644364844527, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004855940304467451}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.1639618887300654, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.003768473720694237}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.0725164426950792, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0030197107273513208}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.16687390506721525, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0035088962671374286}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.0838728953683248, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.002551976059024005}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.12455299793053924, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0037936801945088155}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.3050028170207448, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004518320595879189}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.14973459838273895, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.003227143648327153}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.1263163648899627, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0038597130269363692}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.3062159795615415, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004522396040564721}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.15125353657464896, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0032779530465988412}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b35b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b35b/evaluation/generation/agg.8b7178b35b_GEM-web_nlg_en_PALM_prompt_2.json b/8b7178b35b/evaluation/generation/agg.8b7178b35b_GEM-web_nlg_en_PALM_prompt_2.json new file mode 100644 index 0000000000000000000000000000000000000000..a196fa9e5ea8fbc1cecf1cc2afb09bae613ebf3e --- /dev/null +++ b/8b7178b35b/evaluation/generation/agg.8b7178b35b_GEM-web_nlg_en_PALM_prompt_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.6896289267842831, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.04363432869368013}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.1736763143186271, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.005190144069158226}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.3690495199973296, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004674550419980399}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.19577491362940544, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.004183820712066921}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.09630923485520457, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.003591484421705004}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.19774238776363945, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0036773455774089777}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.10468204406915697, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.002958633901985044}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.15346964126360133, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.004394358403285555}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.34605615384304983, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0043553659806620975}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.17655301985743188, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.003543990303517691}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.15737438288230765, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.004551780258151066}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.34891501370883077, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004358767783710016}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.17970682314011696, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.003629660902642662}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b35b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b35b/evaluation/generation/agg.8b7178b35b_GEM-web_nlg_en_PALM_prompt_3.json b/8b7178b35b/evaluation/generation/agg.8b7178b35b_GEM-web_nlg_en_PALM_prompt_3.json new file mode 100644 index 0000000000000000000000000000000000000000..5bd3ca693ad2346ed59545be2f896a6f42cb53db --- /dev/null +++ b/8b7178b35b/evaluation/generation/agg.8b7178b35b_GEM-web_nlg_en_PALM_prompt_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.7168649256709774, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.04675221435801664}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.1766984056786614, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0052889863501627}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.3784023798729607, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004834949146967397}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.20039314889286589, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.00433393844787534}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.09764044765164406, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0036619448797318528}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.2030335209107597, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.003804312974743258}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.10711581894262515, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.00302754276771825}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.15566438191020568, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.004489975630701125}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.3537310697482285, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004433439714918285}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.18005823477527308, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.003625480259314596}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.1606361822943105, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.004693428623221418}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.3571516509838202, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004469628307077723}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.18404319632429025, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0037645994118713916}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b35b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b35b/evaluation/generation/agg.8b7178b35b_GEM-web_nlg_en_PALM_prompt_4.json b/8b7178b35b/evaluation/generation/agg.8b7178b35b_GEM-web_nlg_en_PALM_prompt_4.json new file mode 100644 index 0000000000000000000000000000000000000000..88568798edb91f87008a1f0a2e087a478f896147 --- /dev/null +++ b/8b7178b35b/evaluation/generation/agg.8b7178b35b_GEM-web_nlg_en_PALM_prompt_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.8264767377736691, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.053779296385247366}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.1812068418232479, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.005398716331751978}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.38369035451056227, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.00470013713630282}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.20221675887809062, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.004283401665288551}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.1006261222318028, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0036927051039995647}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.2074416749104224, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0036680698832641224}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.10880911597097326, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0029539167777379253}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.15862122681407606, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.004530792062039435}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.35743845572365024, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004293662429385583}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.18068778740178215, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0035531966464061853}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.16438209047726673, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.004775185780341334}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.3611996661245711, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.00431294873519373}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.185234182101754, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.00371289144584664}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b35b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b35b/evaluation/generation/agg.8b7178b35b_GEM-web_nlg_en_PALM_prompt_5.json b/8b7178b35b/evaluation/generation/agg.8b7178b35b_GEM-web_nlg_en_PALM_prompt_5.json new file mode 100644 index 0000000000000000000000000000000000000000..c93e2e7b55d55725400e33d46b2962e043c0a5ad --- /dev/null +++ b/8b7178b35b/evaluation/generation/agg.8b7178b35b_GEM-web_nlg_en_PALM_prompt_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.8765489182001927, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.040019456401903304}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.1926905497088421, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0057538188799125855}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.3858328625547419, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004823164304577201}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.20880684983729342, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.004530179904806841}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.11101027585585174, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.004140682260724748}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.21158156307350992, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.003943074328986311}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.11565656452634464, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.003314764756228703}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.16975713372550302, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0049633182199218225}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.3591348058816613, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004445791053730718}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.18694354311801048, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0038293768377802495}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.17553725023286618, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.005177574879953629}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.36311828129199303, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0044570305199087895}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.1915290665625795, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.00396816747113494}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b35b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b35b/evaluation/generation/agg.8b7178b35b_GEM-wiki_lingua_en_tldr_en_0.json b/8b7178b35b/evaluation/generation/agg.8b7178b35b_GEM-wiki_lingua_en_tldr_en_0.json new file mode 100644 index 0000000000000000000000000000000000000000..3c430d6c7d07e9730d31422756b08ba28cf5f176 --- /dev/null +++ b/8b7178b35b/evaluation/generation/agg.8b7178b35b_GEM-wiki_lingua_en_tldr_en_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.1716696703091672, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0028501359020609955}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.25185497103999677, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0034752671023028777}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.18563962193300107, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.00254964484535964}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.04455795738149438, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0011159745679413468}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.06850978198098658, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0017237693104594396}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.049529716403418626, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.001152868080944952}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.1292734642683531, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0022188669387071605}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.1943570396317403, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0027761702028766522}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.13995045719718288, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0018763707447302035}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.1610229468194331, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.002727168940548498}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.2357960382787708, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0032789217359646683}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.17363683324091103, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0023982582496962375}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 3.586033759423314, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.09221854298529836}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b35b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b35b/evaluation/generation/agg.8b7178b35b_GEM-wiki_lingua_en_tldr_en_1.json b/8b7178b35b/evaluation/generation/agg.8b7178b35b_GEM-wiki_lingua_en_tldr_en_1.json new file mode 100644 index 0000000000000000000000000000000000000000..55cc962c7017b58009e9ebf9209dd9647445bdaa --- /dev/null +++ b/8b7178b35b/evaluation/generation/agg.8b7178b35b_GEM-wiki_lingua_en_tldr_en_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.22141486924288373, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.003489092311505774}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.21774103131853748, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.003219238261544544}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.18742769556123198, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0024179522944743578}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.05911494441028749, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.001977492552657427}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.056021987595245265, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0016925719239639409}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.04749462077218236, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0013391994596319457}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.17052813755243684, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0028543436290086777}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.16498921391985125, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0024957799702815765}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.14177658902154563, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0018452092691051947}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.20843084756852662, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.003321140474934239}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.20397276049127364, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0030133958209501476}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.17566654570551468, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0022619479293200127}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 3.0885083531376645, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.09894775701896347}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b35b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b35b/evaluation/generation/agg.8b7178b35b_e2e_nlg_cleaned_generate_text_restaurant_0.json b/8b7178b35b/evaluation/generation/agg.8b7178b35b_e2e_nlg_cleaned_generate_text_restaurant_0.json new file mode 100644 index 0000000000000000000000000000000000000000..b9354ac699fffea5b2b8ba3f143d569857e3928f --- /dev/null +++ b/8b7178b35b/evaluation/generation/agg.8b7178b35b_e2e_nlg_cleaned_generate_text_restaurant_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 3.8008125605460465, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.08334728702857473}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.2090865590305055, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0018470177010718961}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.38188549726437987, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.003279728734456605}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.2613118947613821, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002127912583794242}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.05673694028468428, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0009833704090490367}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.1101409383371642, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.001995492794975982}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.07297635058372318, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.001261248605220041}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.18275732889261928, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0013921067012969746}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.3338079929800571, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0024505755903694226}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.22836186321205557, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0015605125797972495}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.17512630400560542, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0017783983400275266}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.32141092125405557, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0032662985068743528}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.21899459401932223, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002102657843438912}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b35b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b35b/evaluation/generation/agg.8b7178b35b_e2e_nlg_cleaned_generate_text_restaurant_1.json b/8b7178b35b/evaluation/generation/agg.8b7178b35b_e2e_nlg_cleaned_generate_text_restaurant_1.json new file mode 100644 index 0000000000000000000000000000000000000000..c18b7f5c8b941c50fb01eb33d046096166fe4d7e --- /dev/null +++ b/8b7178b35b/evaluation/generation/agg.8b7178b35b_e2e_nlg_cleaned_generate_text_restaurant_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 12.455563496168116, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.15428951986028144}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.5954981850070853, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0032755377697093577}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.44832902186902923, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0030688387452721486}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.4844618589871223, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002388878380866762}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.29040989982948295, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0028204861869818784}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.21450317916657013, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002222395267553394}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.23224231794118463, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0020931392807158806}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.43368332329208353, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.003056248156608264}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.32270327842717356, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0024894724353540653}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.34990734371381305, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0021300316703662904}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.48684291022612447, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0032370809243618716}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.3651475528395549, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002807567486848305}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.39499604706438096, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0023754095690034817}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b35b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b35b/evaluation/generation/agg.8b7178b35b_e2e_nlg_cleaned_generate_text_restaurant_2.json b/8b7178b35b/evaluation/generation/agg.8b7178b35b_e2e_nlg_cleaned_generate_text_restaurant_2.json new file mode 100644 index 0000000000000000000000000000000000000000..aaf9b6a04a010833cf9be5bfa7063cc904cf4246 --- /dev/null +++ b/8b7178b35b/evaluation/generation/agg.8b7178b35b_e2e_nlg_cleaned_generate_text_restaurant_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 15.187891510159636, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.2005340847158173}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.6089225605030864, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0031749506024181815}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.4850253270309617, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0029712295443402523}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.5149400564373232, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002281960188799717}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.3125612676733449, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.002807570058211188}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.24520830668256238, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0023166169808109976}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.26064964037026866, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.002149918786285521}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.45032557438452553, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.002995769757075173}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.3564750276333542, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002545550505071048}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.3791251783681887, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0021638392150190966}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.5099476065779874, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.003210910234266457}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.40596954377109, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002856919494329858}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.4311876269636124, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0024222285980316075}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b35b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b35b/evaluation/generation/agg.8b7178b35b_e2e_nlg_cleaned_generate_text_restaurant_3.json b/8b7178b35b/evaluation/generation/agg.8b7178b35b_e2e_nlg_cleaned_generate_text_restaurant_3.json new file mode 100644 index 0000000000000000000000000000000000000000..25241aac3a57f7388f46dbf02b10ef9209ee8c91 --- /dev/null +++ b/8b7178b35b/evaluation/generation/agg.8b7178b35b_e2e_nlg_cleaned_generate_text_restaurant_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 16.060659394975822, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.17284642655126536}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.6148474805598093, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.003175147795291498}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.4938729679272436, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0029612490025592896}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.5239878618101873, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0022891503962730515}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.32141615003361074, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.00284369777288176}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.2546854150197406, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0023748524797935944}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.27038735747786175, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.002196480015942097}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.45482796385524316, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0030285934039142345}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.3632799719766207, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0025747603467030653}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.3858853477225852, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.002195201839278644}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.5189202264105984, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0032211525451001028}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.41656979202046523, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0028606302793073527}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.44212298577697895, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0024314611034434628}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b35b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b35b/evaluation/generation/agg.8b7178b35b_e2e_nlg_cleaned_generate_text_restaurant_4.json b/8b7178b35b/evaluation/generation/agg.8b7178b35b_e2e_nlg_cleaned_generate_text_restaurant_4.json new file mode 100644 index 0000000000000000000000000000000000000000..b810905ab0d07cbcba573bf633d14a538a894998 --- /dev/null +++ b/8b7178b35b/evaluation/generation/agg.8b7178b35b_e2e_nlg_cleaned_generate_text_restaurant_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 16.35064977606228, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.15318703610951076}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.6141579219291876, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0031375276423873367}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.49642790420160215, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002890279129158977}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.5272948463681918, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002276632828321617}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.3216796674918701, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0028452669990831196}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.2567141692534647, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002372105255220152}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.2730606307438099, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.002234438055141524}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.45388329842280073, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0029409250663779253}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.36571295934350256, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0025294206995360793}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.38874867977872807, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0021952914125996665}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.5193905306564236, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0031731739172339655}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.4201701863764282, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0028340856821376906}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.44624941166081916, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0024399419515776116}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b35b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b35b/evaluation/generation/agg.8b7178b35b_e2e_nlg_cleaned_generate_text_restaurant_5.json b/8b7178b35b/evaluation/generation/agg.8b7178b35b_e2e_nlg_cleaned_generate_text_restaurant_5.json new file mode 100644 index 0000000000000000000000000000000000000000..817ecb614922a4a1214964453b9ddd4e34a2174e --- /dev/null +++ b/8b7178b35b/evaluation/generation/agg.8b7178b35b_e2e_nlg_cleaned_generate_text_restaurant_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 16.33989554218624, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.17192498787094718}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.6138887802372733, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.003148762043973577}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.49579908715969256, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002855704257905023}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.5272012483217712, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0022727033449929193}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.32296239014683903, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.002836651143474931}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.25721295886814427, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0023323863742251865}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.2739732304449431, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0022083117263179994}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.4557756119232901, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.002957529253678058}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.36723275796263094, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002545583277155397}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.39053942113540757, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0022084680095602566}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.520413988660044, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.003202124211985598}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.41985936033161986, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002793790259009851}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.44667560043167237, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002425231007898886}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b35b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b35b/evaluation/generation/agg.8b7178b35b_gem_xsum_article_DOC_summary_0.json b/8b7178b35b/evaluation/generation/agg.8b7178b35b_gem_xsum_article_DOC_summary_0.json new file mode 100644 index 0000000000000000000000000000000000000000..1ebc0812c01f8a6dfdd955e70502138d5ac513ed --- /dev/null +++ b/8b7178b35b/evaluation/generation/agg.8b7178b35b_gem_xsum_article_DOC_summary_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.14704474756783373, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.00260243994472115}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.3179426585120001, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.005091359061361595}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.19497689185235167, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.003037459759774}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.033133611529725375, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0012222134099385885}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.07643755617885226, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002852925969928893}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.04545175235793978, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0016613895167432173}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.10872152825582168, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0020985136406316504}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.23420658227277613, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0038579727721169913}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.14329622002037548, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.002251083734524946}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.11878580563146314, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0022791200374934033}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.2561567987942721, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004250537243559008}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.15671768300152755, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0024938518539829066}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 1.9172897233734647, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.07612979258741162}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b35b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b35b/evaluation/generation/agg.8b7178b35b_gem_xsum_article_DOC_summary_1.json b/8b7178b35b/evaluation/generation/agg.8b7178b35b_gem_xsum_article_DOC_summary_1.json new file mode 100644 index 0000000000000000000000000000000000000000..ccfc4fb1b0b728c8f5e50122ad61ad871a45f94d --- /dev/null +++ b/8b7178b35b/evaluation/generation/agg.8b7178b35b_gem_xsum_article_DOC_summary_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.2506117820029391, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.004197193925421806}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.265051427357207, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004113838412416427}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.2429048922678839, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0035470294629619853}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.059355725931601024, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0026146656506255265}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.06240115907434781, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002528707836330792}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.05697362472735911, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.002319852424027265}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.18675397233452354, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.003437969762757092}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.19744938072178414, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0033460143453592026}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.1806939148235656, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.002897868234740968}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.18896297297256576, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.003436743475620793}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.20147068575801652, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0034574795296360844}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.18340626109421165, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002921137289513508}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 2.9617243214867686, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.2121625238447871}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b35b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b35b/evaluation/generation/agg.8b7178b35b_gem_xsum_article_DOC_summary_2.json b/8b7178b35b/evaluation/generation/agg.8b7178b35b_gem_xsum_article_DOC_summary_2.json new file mode 100644 index 0000000000000000000000000000000000000000..4f1e3e6bd7008df6feb66d0d666921585da24660 --- /dev/null +++ b/8b7178b35b/evaluation/generation/agg.8b7178b35b_gem_xsum_article_DOC_summary_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.2862450933885503, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0042447208222623255}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.2741637614630613, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0038690227267741645}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.2684969037756941, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.003538515661007479}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.07370429393444561, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.002782856999759695}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.07014627514180007, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002596637645417416}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.06850101702956525, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.002469575816155894}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.21544246954500543, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.003580176542199536}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.20674126511922747, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0032887383484612206}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.20209449252255896, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.003025686120342655}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.21658328451330233, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.003567997453456091}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.2083566653493878, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0032948366397107273}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.20333325134792413, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0030149542501899957}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 3.790180948775114, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.21949698226608796}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b35b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b35b/evaluation/generation/agg.global_step84877_GEM-web_nlg_en_PALM_prompt_0.json b/8b7178b35b/evaluation/generation/agg.global_step84877_GEM-web_nlg_en_PALM_prompt_0.json new file mode 100644 index 0000000000000000000000000000000000000000..870ed5e39a4e5d301e1d57702ae0800f05b95cfa --- /dev/null +++ b/8b7178b35b/evaluation/generation/agg.global_step84877_GEM-web_nlg_en_PALM_prompt_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.347289354458488, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.03777797007924809}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.079226368742227, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0023231969845277887}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.28110828630725015, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004882004381200993}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.10890954353426278, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002110258935484955}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.03743726607123581, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.001494228694268955}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.13690374884005102, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.003169133187878269}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.05172430149730381, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0013180585408877222}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.07666350308702279, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0022367957170880146}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.2745019482026448, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004789753920178336}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.10554978776184795, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0020007799763877027}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.07592638133051025, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.002251359653603086}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.2686557447211624, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004613052990575398}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.10411236694388043, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0019983020211639833}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b35b/global_step84877/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b35b/evaluation/generation/agg.global_step84877_GEM-web_nlg_en_PALM_prompt_1.json b/8b7178b35b/evaluation/generation/agg.global_step84877_GEM-web_nlg_en_PALM_prompt_1.json new file mode 100644 index 0000000000000000000000000000000000000000..60eb546cdabcea07570c09fedde5883a72497400 --- /dev/null +++ b/8b7178b35b/evaluation/generation/agg.global_step84877_GEM-web_nlg_en_PALM_prompt_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.5749625372797772, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.042168587225678913}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.1384507797063748, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.004372707845611215}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.322644364844527, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004855940304467451}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.1639618887300654, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.003768473720694237}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.0725164426950792, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0030197107273513208}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.16687390506721525, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0035088962671374286}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.0838728953683248, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.002551976059024005}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.12455299793053924, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0037936801945088155}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.3050028170207448, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004518320595879189}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.14973459838273895, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.003227143648327153}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.1263163648899627, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0038597130269363692}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.3062159795615415, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004522396040564721}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.15125353657464896, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0032779530465988412}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b35b/global_step84877/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b35b/evaluation/generation/agg.global_step84877_GEM-web_nlg_en_PALM_prompt_2.json b/8b7178b35b/evaluation/generation/agg.global_step84877_GEM-web_nlg_en_PALM_prompt_2.json new file mode 100644 index 0000000000000000000000000000000000000000..5cb1faa9f3b331ea4d1df60f6bac5635920547ed --- /dev/null +++ b/8b7178b35b/evaluation/generation/agg.global_step84877_GEM-web_nlg_en_PALM_prompt_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.6896289267842831, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.04363432869368013}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.1736763143186271, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.005190144069158226}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.3690495199973296, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004674550419980399}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.19577491362940544, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.004183820712066921}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.09630923485520457, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.003591484421705004}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.19774238776363945, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0036773455774089777}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.10468204406915697, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.002958633901985044}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.15346964126360133, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.004394358403285555}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.34605615384304983, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0043553659806620975}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.17655301985743188, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.003543990303517691}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.15737438288230765, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.004551780258151066}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.34891501370883077, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004358767783710016}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.17970682314011696, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.003629660902642662}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b35b/global_step84877/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b35b/evaluation/generation/agg.global_step84877_GEM-web_nlg_en_PALM_prompt_3.json b/8b7178b35b/evaluation/generation/agg.global_step84877_GEM-web_nlg_en_PALM_prompt_3.json new file mode 100644 index 0000000000000000000000000000000000000000..76fe29aa7dbe144684e368bb8a94fb70b5c151ef --- /dev/null +++ b/8b7178b35b/evaluation/generation/agg.global_step84877_GEM-web_nlg_en_PALM_prompt_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.7168649256709774, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.04675221435801664}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.1766984056786614, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0052889863501627}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.3784023798729607, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004834949146967397}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.20039314889286589, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.00433393844787534}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.09764044765164406, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0036619448797318528}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.2030335209107597, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.003804312974743258}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.10711581894262515, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.00302754276771825}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.15566438191020568, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.004489975630701125}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.3537310697482285, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004433439714918285}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.18005823477527308, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.003625480259314596}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.1606361822943105, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.004693428623221418}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.3571516509838202, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004469628307077723}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.18404319632429025, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0037645994118713916}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b35b/global_step84877/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b35b/evaluation/generation/agg.global_step84877_GEM-web_nlg_en_PALM_prompt_4.json b/8b7178b35b/evaluation/generation/agg.global_step84877_GEM-web_nlg_en_PALM_prompt_4.json new file mode 100644 index 0000000000000000000000000000000000000000..63cdfdbd987f7d643c2d41d90706554b6717dc8a --- /dev/null +++ b/8b7178b35b/evaluation/generation/agg.global_step84877_GEM-web_nlg_en_PALM_prompt_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.8264767377736691, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.053779296385247366}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.1812068418232479, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.005398716331751978}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.38369035451056227, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.00470013713630282}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.20221675887809062, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.004283401665288551}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.1006261222318028, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0036927051039995647}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.2074416749104224, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0036680698832641224}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.10880911597097326, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0029539167777379253}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.15862122681407606, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.004530792062039435}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.35743845572365024, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004293662429385583}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.18068778740178215, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0035531966464061853}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.16438209047726673, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.004775185780341334}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.3611996661245711, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.00431294873519373}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.185234182101754, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.00371289144584664}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b35b/global_step84877/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b35b/evaluation/generation/agg.global_step84877_GEM-web_nlg_en_PALM_prompt_5.json b/8b7178b35b/evaluation/generation/agg.global_step84877_GEM-web_nlg_en_PALM_prompt_5.json new file mode 100644 index 0000000000000000000000000000000000000000..5a23658b003e3430871db289b80b79840176da3f --- /dev/null +++ b/8b7178b35b/evaluation/generation/agg.global_step84877_GEM-web_nlg_en_PALM_prompt_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.8765489182001927, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.040019456401903304}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.1926905497088421, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0057538188799125855}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.3858328625547419, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004823164304577201}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.20880684983729342, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.004530179904806841}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.11101027585585174, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.004140682260724748}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.21158156307350992, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.003943074328986311}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.11565656452634464, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.003314764756228703}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.16975713372550302, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0049633182199218225}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.3591348058816613, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004445791053730718}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.18694354311801048, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0038293768377802495}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.17553725023286618, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.005177574879953629}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.36311828129199303, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0044570305199087895}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.1915290665625795, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.00396816747113494}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b35b/global_step84877/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b35b/evaluation/generation/agg.global_step84877_GEM-wiki_lingua_en_tldr_en_0.json b/8b7178b35b/evaluation/generation/agg.global_step84877_GEM-wiki_lingua_en_tldr_en_0.json new file mode 100644 index 0000000000000000000000000000000000000000..31a99ee105df607c52b3b2a0e5d31f9d93bf74c3 --- /dev/null +++ b/8b7178b35b/evaluation/generation/agg.global_step84877_GEM-wiki_lingua_en_tldr_en_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.1716696703091672, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0028501359020609955}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.25185497103999677, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0034752671023028777}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.18563962193300107, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.00254964484535964}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.04455795738149438, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0011159745679413468}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.06850978198098658, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0017237693104594396}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.049529716403418626, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.001152868080944952}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.1292734642683531, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0022188669387071605}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.1943570396317403, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0027761702028766522}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.13995045719718288, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0018763707447302035}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.1610229468194331, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.002727168940548498}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.2357960382787708, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0032789217359646683}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.17363683324091103, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0023982582496962375}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 3.586033759423314, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.09221854298529836}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b35b/global_step84877/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b35b/evaluation/generation/agg.global_step84877_GEM-wiki_lingua_en_tldr_en_1.json b/8b7178b35b/evaluation/generation/agg.global_step84877_GEM-wiki_lingua_en_tldr_en_1.json new file mode 100644 index 0000000000000000000000000000000000000000..c424d828e632b70d9087de9e48730576b1eb5f04 --- /dev/null +++ b/8b7178b35b/evaluation/generation/agg.global_step84877_GEM-wiki_lingua_en_tldr_en_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.22141486924288373, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.003489092311505774}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.21774103131853748, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.003219238261544544}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.18742769556123198, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0024179522944743578}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.05911494441028749, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.001977492552657427}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.056021987595245265, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0016925719239639409}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.04749462077218236, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0013391994596319457}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.17052813755243684, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0028543436290086777}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.16498921391985125, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0024957799702815765}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.14177658902154563, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0018452092691051947}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.20843084756852662, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.003321140474934239}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.20397276049127364, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0030133958209501476}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.17566654570551468, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0022619479293200127}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 3.0885083531376645, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.09894775701896347}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b35b/global_step84877/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b35b/evaluation/generation/agg.global_step84877_e2e_nlg_cleaned_generate_text_restaurant_0.json b/8b7178b35b/evaluation/generation/agg.global_step84877_e2e_nlg_cleaned_generate_text_restaurant_0.json new file mode 100644 index 0000000000000000000000000000000000000000..ede56178bd6f13b783def824b3b0823d786f4f73 --- /dev/null +++ b/8b7178b35b/evaluation/generation/agg.global_step84877_e2e_nlg_cleaned_generate_text_restaurant_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 3.8008125605460465, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.08334728702857473}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.2090865590305055, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0018470177010718961}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.38188549726437987, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.003279728734456605}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.2613118947613821, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002127912583794242}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.05673694028468428, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0009833704090490367}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.1101409383371642, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.001995492794975982}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.07297635058372318, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.001261248605220041}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.18275732889261928, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0013921067012969746}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.3338079929800571, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0024505755903694226}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.22836186321205557, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0015605125797972495}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.17512630400560542, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0017783983400275266}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.32141092125405557, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0032662985068743528}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.21899459401932223, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002102657843438912}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b35b/global_step84877/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b35b/evaluation/generation/agg.global_step84877_e2e_nlg_cleaned_generate_text_restaurant_1.json b/8b7178b35b/evaluation/generation/agg.global_step84877_e2e_nlg_cleaned_generate_text_restaurant_1.json new file mode 100644 index 0000000000000000000000000000000000000000..c1c66e4a649ce749281c55d8bf51bc7103ba4503 --- /dev/null +++ b/8b7178b35b/evaluation/generation/agg.global_step84877_e2e_nlg_cleaned_generate_text_restaurant_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 12.455563496168116, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.15428951986028144}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.5954981850070853, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0032755377697093577}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.44832902186902923, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0030688387452721486}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.4844618589871223, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002388878380866762}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.29040989982948295, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0028204861869818784}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.21450317916657013, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002222395267553394}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.23224231794118463, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0020931392807158806}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.43368332329208353, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.003056248156608264}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.32270327842717356, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0024894724353540653}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.34990734371381305, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0021300316703662904}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.48684291022612447, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0032370809243618716}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.3651475528395549, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002807567486848305}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.39499604706438096, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0023754095690034817}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b35b/global_step84877/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b35b/evaluation/generation/agg.global_step84877_e2e_nlg_cleaned_generate_text_restaurant_2.json b/8b7178b35b/evaluation/generation/agg.global_step84877_e2e_nlg_cleaned_generate_text_restaurant_2.json new file mode 100644 index 0000000000000000000000000000000000000000..432c8b1a92d6a230b762bc6d831b486de132c4d4 --- /dev/null +++ b/8b7178b35b/evaluation/generation/agg.global_step84877_e2e_nlg_cleaned_generate_text_restaurant_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 15.187891510159636, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.2005340847158173}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.6089225605030864, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0031749506024181815}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.4850253270309617, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0029712295443402523}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.5149400564373232, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002281960188799717}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.3125612676733449, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.002807570058211188}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.24520830668256238, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0023166169808109976}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.26064964037026866, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.002149918786285521}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.45032557438452553, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.002995769757075173}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.3564750276333542, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002545550505071048}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.3791251783681887, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0021638392150190966}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.5099476065779874, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.003210910234266457}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.40596954377109, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002856919494329858}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.4311876269636124, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0024222285980316075}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b35b/global_step84877/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b35b/evaluation/generation/agg.global_step84877_e2e_nlg_cleaned_generate_text_restaurant_3.json b/8b7178b35b/evaluation/generation/agg.global_step84877_e2e_nlg_cleaned_generate_text_restaurant_3.json new file mode 100644 index 0000000000000000000000000000000000000000..9c2cbfb1b4daed66bda6fe26d0faf8c714930022 --- /dev/null +++ b/8b7178b35b/evaluation/generation/agg.global_step84877_e2e_nlg_cleaned_generate_text_restaurant_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 16.060659394975822, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.17284642655126536}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.6148474805598093, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.003175147795291498}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.4938729679272436, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0029612490025592896}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.5239878618101873, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0022891503962730515}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.32141615003361074, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.00284369777288176}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.2546854150197406, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0023748524797935944}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.27038735747786175, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.002196480015942097}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.45482796385524316, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0030285934039142345}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.3632799719766207, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0025747603467030653}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.3858853477225852, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.002195201839278644}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.5189202264105984, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0032211525451001028}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.41656979202046523, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0028606302793073527}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.44212298577697895, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0024314611034434628}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b35b/global_step84877/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b35b/evaluation/generation/agg.global_step84877_e2e_nlg_cleaned_generate_text_restaurant_4.json b/8b7178b35b/evaluation/generation/agg.global_step84877_e2e_nlg_cleaned_generate_text_restaurant_4.json new file mode 100644 index 0000000000000000000000000000000000000000..c22c14e3275f156661b00978578f201ee244b47b --- /dev/null +++ b/8b7178b35b/evaluation/generation/agg.global_step84877_e2e_nlg_cleaned_generate_text_restaurant_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 16.35064977606228, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.15318703610951076}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.6141579219291876, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0031375276423873367}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.49642790420160215, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002890279129158977}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.5272948463681918, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002276632828321617}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.3216796674918701, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0028452669990831196}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.2567141692534647, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002372105255220152}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.2730606307438099, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.002234438055141524}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.45388329842280073, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0029409250663779253}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.36571295934350256, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0025294206995360793}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.38874867977872807, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0021952914125996665}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.5193905306564236, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0031731739172339655}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.4201701863764282, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0028340856821376906}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.44624941166081916, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0024399419515776116}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b35b/global_step84877/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b35b/evaluation/generation/agg.global_step84877_e2e_nlg_cleaned_generate_text_restaurant_5.json b/8b7178b35b/evaluation/generation/agg.global_step84877_e2e_nlg_cleaned_generate_text_restaurant_5.json new file mode 100644 index 0000000000000000000000000000000000000000..9fc20424a116201529d7ecabaa5679e6f9c7014d --- /dev/null +++ b/8b7178b35b/evaluation/generation/agg.global_step84877_e2e_nlg_cleaned_generate_text_restaurant_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 16.33989554218624, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.17192498787094718}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.6138887802372733, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.003148762043973577}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.49579908715969256, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002855704257905023}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.5272012483217712, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0022727033449929193}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.32296239014683903, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.002836651143474931}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.25721295886814427, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0023323863742251865}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.2739732304449431, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0022083117263179994}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.4557756119232901, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.002957529253678058}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.36723275796263094, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002545583277155397}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.39053942113540757, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0022084680095602566}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.520413988660044, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.003202124211985598}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.41985936033161986, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002793790259009851}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.44667560043167237, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002425231007898886}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b35b/global_step84877/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b35b/evaluation/generation/agg.global_step84877_gem_xsum_article_DOC_summary_0.json b/8b7178b35b/evaluation/generation/agg.global_step84877_gem_xsum_article_DOC_summary_0.json new file mode 100644 index 0000000000000000000000000000000000000000..df0e2e4b880e657142f2a6a0a58cb963179b95ce --- /dev/null +++ b/8b7178b35b/evaluation/generation/agg.global_step84877_gem_xsum_article_DOC_summary_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.14704474756783373, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.00260243994472115}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.3179426585120001, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.005091359061361595}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.19497689185235167, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.003037459759774}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.033133611529725375, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0012222134099385885}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.07643755617885226, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002852925969928893}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.04545175235793978, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0016613895167432173}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.10872152825582168, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0020985136406316504}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.23420658227277613, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0038579727721169913}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.14329622002037548, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.002251083734524946}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.11878580563146314, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0022791200374934033}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.2561567987942721, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004250537243559008}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.15671768300152755, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0024938518539829066}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 1.9172897233734647, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.07612979258741162}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b35b/global_step84877/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b35b/evaluation/generation/agg.global_step84877_gem_xsum_article_DOC_summary_1.json b/8b7178b35b/evaluation/generation/agg.global_step84877_gem_xsum_article_DOC_summary_1.json new file mode 100644 index 0000000000000000000000000000000000000000..71252d3f2b0ac9e56f55006863538b7205079ab0 --- /dev/null +++ b/8b7178b35b/evaluation/generation/agg.global_step84877_gem_xsum_article_DOC_summary_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.2506117820029391, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.004197193925421806}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.265051427357207, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004113838412416427}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.2429048922678839, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0035470294629619853}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.059355725931601024, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0026146656506255265}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.06240115907434781, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002528707836330792}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.05697362472735911, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.002319852424027265}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.18675397233452354, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.003437969762757092}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.19744938072178414, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0033460143453592026}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.1806939148235656, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.002897868234740968}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.18896297297256576, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.003436743475620793}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.20147068575801652, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0034574795296360844}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.18340626109421165, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002921137289513508}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 2.9617243214867686, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.2121625238447871}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b35b/global_step84877/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b35b/evaluation/generation/agg.global_step84877_gem_xsum_article_DOC_summary_2.json b/8b7178b35b/evaluation/generation/agg.global_step84877_gem_xsum_article_DOC_summary_2.json new file mode 100644 index 0000000000000000000000000000000000000000..c126ae130f1384a4432244e07d0f1e189a1e0ad8 --- /dev/null +++ b/8b7178b35b/evaluation/generation/agg.global_step84877_gem_xsum_article_DOC_summary_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.2862450933885503, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0042447208222623255}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.2741637614630613, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0038690227267741645}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.2684969037756941, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.003538515661007479}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.07370429393444561, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.002782856999759695}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.07014627514180007, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002596637645417416}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.06850101702956525, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.002469575816155894}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.21544246954500543, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.003580176542199536}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.20674126511922747, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0032887383484612206}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.20209449252255896, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.003025686120342655}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.21658328451330233, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.003567997453456091}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.2083566653493878, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0032948366397107273}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.20333325134792413, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0030149542501899957}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 3.790180948775114, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.21949698226608796}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b35b/global_step84877/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b35b/evaluation/generation/examples.8b7178b35b_GEM-web_nlg_en_PALM_prompt_0.jsonl b/8b7178b35b/evaluation/generation/examples.8b7178b35b_GEM-web_nlg_en_PALM_prompt_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..6434372ed513b21e4241e6250b2a566a937c31dc --- /dev/null +++ b/8b7178b35b/evaluation/generation/examples.8b7178b35b_GEM-web_nlg_en_PALM_prompt_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:55a86ef36f359ac9d5aa94074b05a9d9549239703765b858e39506d7efd2c562 +size 3928411 diff --git a/8b7178b35b/evaluation/generation/examples.8b7178b35b_GEM-web_nlg_en_PALM_prompt_1.jsonl b/8b7178b35b/evaluation/generation/examples.8b7178b35b_GEM-web_nlg_en_PALM_prompt_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..010eebeb3c6cf3cf56e5e1b4f3e9776c67e02419 --- /dev/null +++ b/8b7178b35b/evaluation/generation/examples.8b7178b35b_GEM-web_nlg_en_PALM_prompt_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9af5a5a8825e609c982ee918b122927cc29f2101679cef30797eea2334eccfbe +size 4708949 diff --git a/8b7178b35b/evaluation/generation/examples.8b7178b35b_GEM-web_nlg_en_PALM_prompt_2.jsonl b/8b7178b35b/evaluation/generation/examples.8b7178b35b_GEM-web_nlg_en_PALM_prompt_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..b11d1ffba06e707b05dee2a535d54ade62466f90 --- /dev/null +++ b/8b7178b35b/evaluation/generation/examples.8b7178b35b_GEM-web_nlg_en_PALM_prompt_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3dacd76c8bf7945ffbfc5381d1455b0bdd727f305b176465b806b9b46dbccbaf +size 5601657 diff --git a/8b7178b35b/evaluation/generation/examples.8b7178b35b_GEM-web_nlg_en_PALM_prompt_3.jsonl b/8b7178b35b/evaluation/generation/examples.8b7178b35b_GEM-web_nlg_en_PALM_prompt_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..47aee388443ab5b45088b77b7c840593e05cb68f --- /dev/null +++ b/8b7178b35b/evaluation/generation/examples.8b7178b35b_GEM-web_nlg_en_PALM_prompt_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:83d9d9cc4619824551b3d217dfbfae94a54feac83cb452c5c310d37db929d1c1 +size 6516902 diff --git a/8b7178b35b/evaluation/generation/examples.8b7178b35b_GEM-web_nlg_en_PALM_prompt_4.jsonl b/8b7178b35b/evaluation/generation/examples.8b7178b35b_GEM-web_nlg_en_PALM_prompt_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..47240dcbb2d2e4709a55dfe0d078ea5e246fda94 --- /dev/null +++ b/8b7178b35b/evaluation/generation/examples.8b7178b35b_GEM-web_nlg_en_PALM_prompt_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1157819717a80d400dc74bfa366a7e280b39a993898e4035c8bd59132bf00a3d +size 7410174 diff --git a/8b7178b35b/evaluation/generation/examples.8b7178b35b_GEM-web_nlg_en_PALM_prompt_5.jsonl b/8b7178b35b/evaluation/generation/examples.8b7178b35b_GEM-web_nlg_en_PALM_prompt_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..7d3143ed62b692dc45c91469c52335d04e584a73 --- /dev/null +++ b/8b7178b35b/evaluation/generation/examples.8b7178b35b_GEM-web_nlg_en_PALM_prompt_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9976e84bc3c92fde4af04c683df1b67d6ffa996d26311d778feef1834e84b3bb +size 8299847 diff --git a/8b7178b35b/evaluation/generation/examples.8b7178b35b_GEM-wiki_lingua_en_tldr_en_0.jsonl b/8b7178b35b/evaluation/generation/examples.8b7178b35b_GEM-wiki_lingua_en_tldr_en_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..f238e31178fa8b02ef57bd78ffc322f4512dc9fa --- /dev/null +++ b/8b7178b35b/evaluation/generation/examples.8b7178b35b_GEM-wiki_lingua_en_tldr_en_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ec8bfdfcc8cf0b42f32ad779cb05aed44821eb68d4dc722df3bc3c35801e871 +size 7500005 diff --git a/8b7178b35b/evaluation/generation/examples.8b7178b35b_GEM-wiki_lingua_en_tldr_en_1.jsonl b/8b7178b35b/evaluation/generation/examples.8b7178b35b_GEM-wiki_lingua_en_tldr_en_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..46a4bf2cd6e18e1298fcd731d7fb10aa211ca9d6 --- /dev/null +++ b/8b7178b35b/evaluation/generation/examples.8b7178b35b_GEM-wiki_lingua_en_tldr_en_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92a30318e190a48cf0a56a605af43b599d304b2347acf6f7eb0758209cdb7670 +size 13010230 diff --git a/8b7178b35b/evaluation/generation/examples.8b7178b35b_GEM-wiki_lingua_en_tldr_en_2.jsonl b/8b7178b35b/evaluation/generation/examples.8b7178b35b_GEM-wiki_lingua_en_tldr_en_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/8b7178b35b/evaluation/generation/examples.8b7178b35b_GEM-wiki_lingua_en_tldr_en_3.jsonl b/8b7178b35b/evaluation/generation/examples.8b7178b35b_GEM-wiki_lingua_en_tldr_en_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/8b7178b35b/evaluation/generation/examples.8b7178b35b_GEM-wiki_lingua_en_tldr_en_4.jsonl b/8b7178b35b/evaluation/generation/examples.8b7178b35b_GEM-wiki_lingua_en_tldr_en_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/8b7178b35b/evaluation/generation/examples.8b7178b35b_GEM-wiki_lingua_en_tldr_en_5.jsonl b/8b7178b35b/evaluation/generation/examples.8b7178b35b_GEM-wiki_lingua_en_tldr_en_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/8b7178b35b/evaluation/generation/examples.8b7178b35b_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl b/8b7178b35b/evaluation/generation/examples.8b7178b35b_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..0cfd70dcf87678d524e7f910b285b5c739d16a70 --- /dev/null +++ b/8b7178b35b/evaluation/generation/examples.8b7178b35b_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a93e3fa7c1124d18aa8bf18eabc6dccaab044b1d7ccf77b919b53790ebf21d4c +size 4413579 diff --git a/8b7178b35b/evaluation/generation/examples.8b7178b35b_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl b/8b7178b35b/evaluation/generation/examples.8b7178b35b_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..848a95351dfced75706e60419a683174c4d6b295 --- /dev/null +++ b/8b7178b35b/evaluation/generation/examples.8b7178b35b_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:42a1bad4ab91299b0269e5573e0bc6846be1ce4355f7c50de29a41a6515c3cdc +size 4997641 diff --git a/8b7178b35b/evaluation/generation/examples.8b7178b35b_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl b/8b7178b35b/evaluation/generation/examples.8b7178b35b_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..bdc21dc7093971f98bd0696e83ecbe094569a36b --- /dev/null +++ b/8b7178b35b/evaluation/generation/examples.8b7178b35b_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d85870c0bc245d836206edc8c50d3b4f487720aabd445e64bbaf90e9fbf44959 +size 6096223 diff --git a/8b7178b35b/evaluation/generation/examples.8b7178b35b_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl b/8b7178b35b/evaluation/generation/examples.8b7178b35b_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..1293abce10bb62e169d08a7bc0052b05b510bc51 --- /dev/null +++ b/8b7178b35b/evaluation/generation/examples.8b7178b35b_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b743ac4483db234fb1abe8b5aeadbb04638e9b680d9d118994e1908ec3d9ba30 +size 7179999 diff --git a/8b7178b35b/evaluation/generation/examples.8b7178b35b_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl b/8b7178b35b/evaluation/generation/examples.8b7178b35b_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..be4e0989eaf266ce708b946fb8b39b175b4b4740 --- /dev/null +++ b/8b7178b35b/evaluation/generation/examples.8b7178b35b_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd5159fc6288c094f7575cb78553aea65f897bf1f2f38e36a8cab1801eecf7bb +size 8259167 diff --git a/8b7178b35b/evaluation/generation/examples.8b7178b35b_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl b/8b7178b35b/evaluation/generation/examples.8b7178b35b_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..357d71b502d6917638df26afd5cc28c441a39d82 --- /dev/null +++ b/8b7178b35b/evaluation/generation/examples.8b7178b35b_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa2270875a1f1622ea954bac17a8e64829db07972ec52142179b30ee55722833 +size 9345831 diff --git a/8b7178b35b/evaluation/generation/examples.8b7178b35b_gem_xsum_article_DOC_summary_0.jsonl b/8b7178b35b/evaluation/generation/examples.8b7178b35b_gem_xsum_article_DOC_summary_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..72f868f4e03b17582bb101648ef402e9f1de0c06 --- /dev/null +++ b/8b7178b35b/evaluation/generation/examples.8b7178b35b_gem_xsum_article_DOC_summary_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d80d2e6afd67ccaa9cb7d4bd9a05ffb919b0ed276527dfac79e91b9bcd79263 +size 2792796 diff --git a/8b7178b35b/evaluation/generation/examples.8b7178b35b_gem_xsum_article_DOC_summary_1.jsonl b/8b7178b35b/evaluation/generation/examples.8b7178b35b_gem_xsum_article_DOC_summary_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..09f3028bd38a936279947980b8b45b621a2cb4ca --- /dev/null +++ b/8b7178b35b/evaluation/generation/examples.8b7178b35b_gem_xsum_article_DOC_summary_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64d4303d8d29bf9f8556b4da7a88b4f176517b6916c4ed920c9e6c8fcd7b9aa0 +size 4925541 diff --git a/8b7178b35b/evaluation/generation/examples.8b7178b35b_gem_xsum_article_DOC_summary_2.jsonl b/8b7178b35b/evaluation/generation/examples.8b7178b35b_gem_xsum_article_DOC_summary_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..3b5fb4eddbe2292a074340b08aca2c8b7fdd0692 --- /dev/null +++ b/8b7178b35b/evaluation/generation/examples.8b7178b35b_gem_xsum_article_DOC_summary_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3cf7feaa75b646454ddcc96165d9158ac3239d7537e46df91eebebc14afd8a13 +size 7177694 diff --git a/8b7178b35b/evaluation/generation/examples.8b7178b35b_gem_xsum_article_DOC_summary_3.jsonl b/8b7178b35b/evaluation/generation/examples.8b7178b35b_gem_xsum_article_DOC_summary_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/8b7178b35b/evaluation/generation/examples.8b7178b35b_gem_xsum_article_DOC_summary_4.jsonl b/8b7178b35b/evaluation/generation/examples.8b7178b35b_gem_xsum_article_DOC_summary_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/8b7178b35b/evaluation/generation/examples.8b7178b35b_gem_xsum_article_DOC_summary_5.jsonl b/8b7178b35b/evaluation/generation/examples.8b7178b35b_gem_xsum_article_DOC_summary_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/8b7178b35b/evaluation/generation/examples.global_step84877_GEM-web_nlg_en_PALM_prompt_0.jsonl b/8b7178b35b/evaluation/generation/examples.global_step84877_GEM-web_nlg_en_PALM_prompt_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..6434372ed513b21e4241e6250b2a566a937c31dc --- /dev/null +++ b/8b7178b35b/evaluation/generation/examples.global_step84877_GEM-web_nlg_en_PALM_prompt_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:55a86ef36f359ac9d5aa94074b05a9d9549239703765b858e39506d7efd2c562 +size 3928411 diff --git a/8b7178b35b/evaluation/generation/examples.global_step84877_GEM-web_nlg_en_PALM_prompt_1.jsonl b/8b7178b35b/evaluation/generation/examples.global_step84877_GEM-web_nlg_en_PALM_prompt_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..010eebeb3c6cf3cf56e5e1b4f3e9776c67e02419 --- /dev/null +++ b/8b7178b35b/evaluation/generation/examples.global_step84877_GEM-web_nlg_en_PALM_prompt_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9af5a5a8825e609c982ee918b122927cc29f2101679cef30797eea2334eccfbe +size 4708949 diff --git a/8b7178b35b/evaluation/generation/examples.global_step84877_GEM-web_nlg_en_PALM_prompt_2.jsonl b/8b7178b35b/evaluation/generation/examples.global_step84877_GEM-web_nlg_en_PALM_prompt_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..b11d1ffba06e707b05dee2a535d54ade62466f90 --- /dev/null +++ b/8b7178b35b/evaluation/generation/examples.global_step84877_GEM-web_nlg_en_PALM_prompt_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3dacd76c8bf7945ffbfc5381d1455b0bdd727f305b176465b806b9b46dbccbaf +size 5601657 diff --git a/8b7178b35b/evaluation/generation/examples.global_step84877_GEM-web_nlg_en_PALM_prompt_3.jsonl b/8b7178b35b/evaluation/generation/examples.global_step84877_GEM-web_nlg_en_PALM_prompt_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..47aee388443ab5b45088b77b7c840593e05cb68f --- /dev/null +++ b/8b7178b35b/evaluation/generation/examples.global_step84877_GEM-web_nlg_en_PALM_prompt_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:83d9d9cc4619824551b3d217dfbfae94a54feac83cb452c5c310d37db929d1c1 +size 6516902 diff --git a/8b7178b35b/evaluation/generation/examples.global_step84877_GEM-web_nlg_en_PALM_prompt_4.jsonl b/8b7178b35b/evaluation/generation/examples.global_step84877_GEM-web_nlg_en_PALM_prompt_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..47240dcbb2d2e4709a55dfe0d078ea5e246fda94 --- /dev/null +++ b/8b7178b35b/evaluation/generation/examples.global_step84877_GEM-web_nlg_en_PALM_prompt_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1157819717a80d400dc74bfa366a7e280b39a993898e4035c8bd59132bf00a3d +size 7410174 diff --git a/8b7178b35b/evaluation/generation/examples.global_step84877_GEM-web_nlg_en_PALM_prompt_5.jsonl b/8b7178b35b/evaluation/generation/examples.global_step84877_GEM-web_nlg_en_PALM_prompt_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..7d3143ed62b692dc45c91469c52335d04e584a73 --- /dev/null +++ b/8b7178b35b/evaluation/generation/examples.global_step84877_GEM-web_nlg_en_PALM_prompt_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9976e84bc3c92fde4af04c683df1b67d6ffa996d26311d778feef1834e84b3bb +size 8299847 diff --git a/8b7178b35b/evaluation/generation/examples.global_step84877_GEM-wiki_lingua_en_tldr_en_0.jsonl b/8b7178b35b/evaluation/generation/examples.global_step84877_GEM-wiki_lingua_en_tldr_en_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..f238e31178fa8b02ef57bd78ffc322f4512dc9fa --- /dev/null +++ b/8b7178b35b/evaluation/generation/examples.global_step84877_GEM-wiki_lingua_en_tldr_en_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ec8bfdfcc8cf0b42f32ad779cb05aed44821eb68d4dc722df3bc3c35801e871 +size 7500005 diff --git a/8b7178b35b/evaluation/generation/examples.global_step84877_GEM-wiki_lingua_en_tldr_en_1.jsonl b/8b7178b35b/evaluation/generation/examples.global_step84877_GEM-wiki_lingua_en_tldr_en_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..46a4bf2cd6e18e1298fcd731d7fb10aa211ca9d6 --- /dev/null +++ b/8b7178b35b/evaluation/generation/examples.global_step84877_GEM-wiki_lingua_en_tldr_en_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92a30318e190a48cf0a56a605af43b599d304b2347acf6f7eb0758209cdb7670 +size 13010230 diff --git a/8b7178b35b/evaluation/generation/examples.global_step84877_GEM-wiki_lingua_en_tldr_en_2.jsonl b/8b7178b35b/evaluation/generation/examples.global_step84877_GEM-wiki_lingua_en_tldr_en_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/8b7178b35b/evaluation/generation/examples.global_step84877_GEM-wiki_lingua_en_tldr_en_3.jsonl b/8b7178b35b/evaluation/generation/examples.global_step84877_GEM-wiki_lingua_en_tldr_en_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/8b7178b35b/evaluation/generation/examples.global_step84877_GEM-wiki_lingua_en_tldr_en_4.jsonl b/8b7178b35b/evaluation/generation/examples.global_step84877_GEM-wiki_lingua_en_tldr_en_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/8b7178b35b/evaluation/generation/examples.global_step84877_GEM-wiki_lingua_en_tldr_en_5.jsonl b/8b7178b35b/evaluation/generation/examples.global_step84877_GEM-wiki_lingua_en_tldr_en_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/8b7178b35b/evaluation/generation/examples.global_step84877_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl b/8b7178b35b/evaluation/generation/examples.global_step84877_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..0cfd70dcf87678d524e7f910b285b5c739d16a70 --- /dev/null +++ b/8b7178b35b/evaluation/generation/examples.global_step84877_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a93e3fa7c1124d18aa8bf18eabc6dccaab044b1d7ccf77b919b53790ebf21d4c +size 4413579 diff --git a/8b7178b35b/evaluation/generation/examples.global_step84877_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl b/8b7178b35b/evaluation/generation/examples.global_step84877_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..848a95351dfced75706e60419a683174c4d6b295 --- /dev/null +++ b/8b7178b35b/evaluation/generation/examples.global_step84877_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:42a1bad4ab91299b0269e5573e0bc6846be1ce4355f7c50de29a41a6515c3cdc +size 4997641 diff --git a/8b7178b35b/evaluation/generation/examples.global_step84877_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl b/8b7178b35b/evaluation/generation/examples.global_step84877_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..bdc21dc7093971f98bd0696e83ecbe094569a36b --- /dev/null +++ b/8b7178b35b/evaluation/generation/examples.global_step84877_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d85870c0bc245d836206edc8c50d3b4f487720aabd445e64bbaf90e9fbf44959 +size 6096223 diff --git a/8b7178b35b/evaluation/generation/examples.global_step84877_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl b/8b7178b35b/evaluation/generation/examples.global_step84877_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..1293abce10bb62e169d08a7bc0052b05b510bc51 --- /dev/null +++ b/8b7178b35b/evaluation/generation/examples.global_step84877_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b743ac4483db234fb1abe8b5aeadbb04638e9b680d9d118994e1908ec3d9ba30 +size 7179999 diff --git a/8b7178b35b/evaluation/generation/examples.global_step84877_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl b/8b7178b35b/evaluation/generation/examples.global_step84877_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..be4e0989eaf266ce708b946fb8b39b175b4b4740 --- /dev/null +++ b/8b7178b35b/evaluation/generation/examples.global_step84877_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd5159fc6288c094f7575cb78553aea65f897bf1f2f38e36a8cab1801eecf7bb +size 8259167 diff --git a/8b7178b35b/evaluation/generation/examples.global_step84877_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl b/8b7178b35b/evaluation/generation/examples.global_step84877_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..357d71b502d6917638df26afd5cc28c441a39d82 --- /dev/null +++ b/8b7178b35b/evaluation/generation/examples.global_step84877_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa2270875a1f1622ea954bac17a8e64829db07972ec52142179b30ee55722833 +size 9345831 diff --git a/8b7178b35b/evaluation/generation/examples.global_step84877_gem_xsum_article_DOC_summary_0.jsonl b/8b7178b35b/evaluation/generation/examples.global_step84877_gem_xsum_article_DOC_summary_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..72f868f4e03b17582bb101648ef402e9f1de0c06 --- /dev/null +++ b/8b7178b35b/evaluation/generation/examples.global_step84877_gem_xsum_article_DOC_summary_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d80d2e6afd67ccaa9cb7d4bd9a05ffb919b0ed276527dfac79e91b9bcd79263 +size 2792796 diff --git a/8b7178b35b/evaluation/generation/examples.global_step84877_gem_xsum_article_DOC_summary_1.jsonl b/8b7178b35b/evaluation/generation/examples.global_step84877_gem_xsum_article_DOC_summary_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..09f3028bd38a936279947980b8b45b621a2cb4ca --- /dev/null +++ b/8b7178b35b/evaluation/generation/examples.global_step84877_gem_xsum_article_DOC_summary_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64d4303d8d29bf9f8556b4da7a88b4f176517b6916c4ed920c9e6c8fcd7b9aa0 +size 4925541 diff --git a/8b7178b35b/evaluation/generation/examples.global_step84877_gem_xsum_article_DOC_summary_2.jsonl b/8b7178b35b/evaluation/generation/examples.global_step84877_gem_xsum_article_DOC_summary_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..3b5fb4eddbe2292a074340b08aca2c8b7fdd0692 --- /dev/null +++ b/8b7178b35b/evaluation/generation/examples.global_step84877_gem_xsum_article_DOC_summary_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3cf7feaa75b646454ddcc96165d9158ac3239d7537e46df91eebebc14afd8a13 +size 7177694 diff --git a/8b7178b35b/evaluation/generation/examples.global_step84877_gem_xsum_article_DOC_summary_3.jsonl b/8b7178b35b/evaluation/generation/examples.global_step84877_gem_xsum_article_DOC_summary_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/8b7178b35b/evaluation/generation/examples.global_step84877_gem_xsum_article_DOC_summary_4.jsonl b/8b7178b35b/evaluation/generation/examples.global_step84877_gem_xsum_article_DOC_summary_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/8b7178b35b/evaluation/generation/examples.global_step84877_gem_xsum_article_DOC_summary_5.jsonl b/8b7178b35b/evaluation/generation/examples.global_step84877_gem_xsum_article_DOC_summary_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/8b7178b35b/evaluation/generation/merged.csv b/8b7178b35b/evaluation/generation/merged.csv new file mode 100644 index 0000000000000000000000000000000000000000..94e96839377380f1faa8ddf2dbeb12c2d127e226 --- /dev/null +++ b/8b7178b35b/evaluation/generation/merged.csv @@ -0,0 +1,39 @@ +dataset,fewshots,prompt,metric,value +e2e_nlg_cleaned,0,generate_text_restaurant,rouge2_fmeasure,0.07297635058372318 +e2e_nlg_cleaned,0,median,rouge2_fmeasure,0.07297635058372318 +e2e_nlg_cleaned,1,generate_text_restaurant,rouge2_fmeasure,0.23224231794118463 +e2e_nlg_cleaned,1,median,rouge2_fmeasure,0.23224231794118463 +e2e_nlg_cleaned,2,generate_text_restaurant,rouge2_fmeasure,0.26064964037026866 +e2e_nlg_cleaned,2,median,rouge2_fmeasure,0.26064964037026866 +e2e_nlg_cleaned,3,generate_text_restaurant,rouge2_fmeasure,0.27038735747786175 +e2e_nlg_cleaned,3,median,rouge2_fmeasure,0.27038735747786175 +e2e_nlg_cleaned,4,generate_text_restaurant,rouge2_fmeasure,0.2730606307438099 +e2e_nlg_cleaned,4,median,rouge2_fmeasure,0.2730606307438099 +e2e_nlg_cleaned,5,generate_text_restaurant,rouge2_fmeasure,0.2739732304449431 +e2e_nlg_cleaned,5,median,rouge2_fmeasure,0.2739732304449431 +e2e_nlg_cleaned,5,average,multiple,0.23054825459363187 +gem_xsum,0,article_DOC_summary,rouge2_fmeasure,0.04545175235793978 +gem_xsum,0,median,rouge2_fmeasure,0.04545175235793978 +gem_xsum,1,article_DOC_summary,rouge2_fmeasure,0.05697362472735911 +gem_xsum,1,median,rouge2_fmeasure,0.05697362472735911 +gem_xsum,2,article_DOC_summary,rouge2_fmeasure,0.06850101702956525 +gem_xsum,2,median,rouge2_fmeasure,0.06850101702956525 +gem_xsum,2,average,multiple,0.056975464704954716 +web_nlg_en,0,PALM_prompt,rouge2_fmeasure,0.05172430149730381 +web_nlg_en,0,median,rouge2_fmeasure,0.05172430149730381 +web_nlg_en,1,PALM_prompt,rouge2_fmeasure,0.0838728953683248 +web_nlg_en,1,median,rouge2_fmeasure,0.0838728953683248 +web_nlg_en,2,PALM_prompt,rouge2_fmeasure,0.10468204406915697 +web_nlg_en,2,median,rouge2_fmeasure,0.10468204406915697 +web_nlg_en,3,PALM_prompt,rouge2_fmeasure,0.10711581894262515 +web_nlg_en,3,median,rouge2_fmeasure,0.10711581894262515 +web_nlg_en,4,PALM_prompt,rouge2_fmeasure,0.10880911597097326 +web_nlg_en,4,median,rouge2_fmeasure,0.10880911597097326 +web_nlg_en,5,PALM_prompt,rouge2_fmeasure,0.11565656452634464 +web_nlg_en,5,median,rouge2_fmeasure,0.11565656452634464 +web_nlg_en,5,average,multiple,0.09531012339578811 +wiki_lingua_en,0,tldr_en,rouge2_fmeasure,0.049529716403418626 +wiki_lingua_en,0,median,rouge2_fmeasure,0.049529716403418626 +wiki_lingua_en,1,tldr_en,rouge2_fmeasure,0.04749462077218236 +wiki_lingua_en,1,median,rouge2_fmeasure,0.04749462077218236 +wiki_lingua_en,1,average,multiple,0.0485121685878005 diff --git a/8b7178b35b/evaluation/generation/merged.json b/8b7178b35b/evaluation/generation/merged.json new file mode 100644 index 0000000000000000000000000000000000000000..2091ecf15b978177515d491c0194e18f74193615 --- /dev/null +++ b/8b7178b35b/evaluation/generation/merged.json @@ -0,0 +1 @@ +{"GEM/web_nlg_en": {"0": {"PALM_prompt": {"bleu": 0.347289354458488, "bleu_stderr": 0.03777797007924809, "rouge1_fmeasure": 0.10890954353426278, "rouge1_fmeasure_stderr": 0.002110258935484955, "rouge1_precision": 0.079226368742227, "rouge1_precision_stderr": 0.0023231969845277887, "rouge1_recall": 0.28110828630725015, "rouge1_recall_stderr": 0.004882004381200993, "rouge2_fmeasure": 0.05172430149730381, "rouge2_fmeasure_stderr": 0.0013180585408877222, "rouge2_precision": 0.03743726607123581, "rouge2_precision_stderr": 0.001494228694268955, "rouge2_recall": 0.13690374884005102, "rouge2_recall_stderr": 0.003169133187878269, "rougeL_fmeasure": 0.10554978776184795, "rougeL_fmeasure_stderr": 0.0020007799763877027, "rougeL_precision": 0.07666350308702279, "rougeL_precision_stderr": 0.0022367957170880146, "rougeL_recall": 0.2745019482026448, "rougeL_recall_stderr": 0.004789753920178336, "rougeLsum_fmeasure": 0.10411236694388043, "rougeLsum_fmeasure_stderr": 0.0019983020211639833, "rougeLsum_precision": 0.07592638133051025, "rougeLsum_precision_stderr": 0.002251359653603086, "rougeLsum_recall": 0.2686557447211624, "rougeLsum_recall_stderr": 0.004613052990575398}}, "1": {"PALM_prompt": {"bleu": 0.5749625372797772, "bleu_stderr": 0.042168587225678913, "rouge1_fmeasure": 0.1639618887300654, "rouge1_fmeasure_stderr": 0.003768473720694237, "rouge1_precision": 0.1384507797063748, "rouge1_precision_stderr": 0.004372707845611215, "rouge1_recall": 0.322644364844527, "rouge1_recall_stderr": 0.004855940304467451, "rouge2_fmeasure": 0.0838728953683248, "rouge2_fmeasure_stderr": 0.002551976059024005, "rouge2_precision": 0.0725164426950792, "rouge2_precision_stderr": 0.0030197107273513208, "rouge2_recall": 0.16687390506721525, "rouge2_recall_stderr": 0.0035088962671374286, "rougeL_fmeasure": 0.14973459838273895, "rougeL_fmeasure_stderr": 0.003227143648327153, "rougeL_precision": 0.12455299793053924, "rougeL_precision_stderr": 0.0037936801945088155, "rougeL_recall": 0.3050028170207448, "rougeL_recall_stderr": 0.004518320595879189, "rougeLsum_fmeasure": 0.15125353657464896, "rougeLsum_fmeasure_stderr": 0.0032779530465988412, "rougeLsum_precision": 0.1263163648899627, "rougeLsum_precision_stderr": 0.0038597130269363692, "rougeLsum_recall": 0.3062159795615415, "rougeLsum_recall_stderr": 0.004522396040564721}}, "2": {"PALM_prompt": {"bleu": 0.6896289267842831, "bleu_stderr": 0.04363432869368013, "rouge1_fmeasure": 0.19577491362940544, "rouge1_fmeasure_stderr": 0.004183820712066921, "rouge1_precision": 0.1736763143186271, "rouge1_precision_stderr": 0.005190144069158226, "rouge1_recall": 0.3690495199973296, "rouge1_recall_stderr": 0.004674550419980399, "rouge2_fmeasure": 0.10468204406915697, "rouge2_fmeasure_stderr": 0.002958633901985044, "rouge2_precision": 0.09630923485520457, "rouge2_precision_stderr": 0.003591484421705004, "rouge2_recall": 0.19774238776363945, "rouge2_recall_stderr": 0.0036773455774089777, "rougeL_fmeasure": 0.17655301985743188, "rougeL_fmeasure_stderr": 0.003543990303517691, "rougeL_precision": 0.15346964126360133, "rougeL_precision_stderr": 0.004394358403285555, "rougeL_recall": 0.34605615384304983, "rougeL_recall_stderr": 0.0043553659806620975, "rougeLsum_fmeasure": 0.17970682314011696, "rougeLsum_fmeasure_stderr": 0.003629660902642662, "rougeLsum_precision": 0.15737438288230765, "rougeLsum_precision_stderr": 0.004551780258151066, "rougeLsum_recall": 0.34891501370883077, "rougeLsum_recall_stderr": 0.004358767783710016}}, "3": {"PALM_prompt": {"bleu": 0.7168649256709774, "bleu_stderr": 0.04675221435801664, "rouge1_fmeasure": 0.20039314889286589, "rouge1_fmeasure_stderr": 0.00433393844787534, "rouge1_precision": 0.1766984056786614, "rouge1_precision_stderr": 0.0052889863501627, "rouge1_recall": 0.3784023798729607, "rouge1_recall_stderr": 0.004834949146967397, "rouge2_fmeasure": 0.10711581894262515, "rouge2_fmeasure_stderr": 0.00302754276771825, "rouge2_precision": 0.09764044765164406, "rouge2_precision_stderr": 0.0036619448797318528, "rouge2_recall": 0.2030335209107597, "rouge2_recall_stderr": 0.003804312974743258, "rougeL_fmeasure": 0.18005823477527308, "rougeL_fmeasure_stderr": 0.003625480259314596, "rougeL_precision": 0.15566438191020568, "rougeL_precision_stderr": 0.004489975630701125, "rougeL_recall": 0.3537310697482285, "rougeL_recall_stderr": 0.004433439714918285, "rougeLsum_fmeasure": 0.18404319632429025, "rougeLsum_fmeasure_stderr": 0.0037645994118713916, "rougeLsum_precision": 0.1606361822943105, "rougeLsum_precision_stderr": 0.004693428623221418, "rougeLsum_recall": 0.3571516509838202, "rougeLsum_recall_stderr": 0.004469628307077723}}, "4": {"PALM_prompt": {"bleu": 0.8264767377736691, "bleu_stderr": 0.053779296385247366, "rouge1_fmeasure": 0.20221675887809062, "rouge1_fmeasure_stderr": 0.004283401665288551, "rouge1_precision": 0.1812068418232479, "rouge1_precision_stderr": 0.005398716331751978, "rouge1_recall": 0.38369035451056227, "rouge1_recall_stderr": 0.00470013713630282, "rouge2_fmeasure": 0.10880911597097326, "rouge2_fmeasure_stderr": 0.0029539167777379253, "rouge2_precision": 0.1006261222318028, "rouge2_precision_stderr": 0.0036927051039995647, "rouge2_recall": 0.2074416749104224, "rouge2_recall_stderr": 0.0036680698832641224, "rougeL_fmeasure": 0.18068778740178215, "rougeL_fmeasure_stderr": 0.0035531966464061853, "rougeL_precision": 0.15862122681407606, "rougeL_precision_stderr": 0.004530792062039435, "rougeL_recall": 0.35743845572365024, "rougeL_recall_stderr": 0.004293662429385583, "rougeLsum_fmeasure": 0.185234182101754, "rougeLsum_fmeasure_stderr": 0.00371289144584664, "rougeLsum_precision": 0.16438209047726673, "rougeLsum_precision_stderr": 0.004775185780341334, "rougeLsum_recall": 0.3611996661245711, "rougeLsum_recall_stderr": 0.00431294873519373}}, "5": {"PALM_prompt": {"bleu": 0.8765489182001927, "bleu_stderr": 0.040019456401903304, "rouge1_fmeasure": 0.20880684983729342, "rouge1_fmeasure_stderr": 0.004530179904806841, "rouge1_precision": 0.1926905497088421, "rouge1_precision_stderr": 0.0057538188799125855, "rouge1_recall": 0.3858328625547419, "rouge1_recall_stderr": 0.004823164304577201, "rouge2_fmeasure": 0.11565656452634464, "rouge2_fmeasure_stderr": 0.003314764756228703, "rouge2_precision": 0.11101027585585174, "rouge2_precision_stderr": 0.004140682260724748, "rouge2_recall": 0.21158156307350992, "rouge2_recall_stderr": 0.003943074328986311, "rougeL_fmeasure": 0.18694354311801048, "rougeL_fmeasure_stderr": 0.0038293768377802495, "rougeL_precision": 0.16975713372550302, "rougeL_precision_stderr": 0.0049633182199218225, "rougeL_recall": 0.3591348058816613, "rougeL_recall_stderr": 0.004445791053730718, "rougeLsum_fmeasure": 0.1915290665625795, "rougeLsum_fmeasure_stderr": 0.00396816747113494, "rougeLsum_precision": 0.17553725023286618, "rougeLsum_precision_stderr": 0.005177574879953629, "rougeLsum_recall": 0.36311828129199303, "rougeLsum_recall_stderr": 0.0044570305199087895}}}, "GEM/wiki_lingua_en": {"0": {"tldr_en": {"bleu": 3.586033759423314, "bleu_stderr": 0.09221854298529836, "rouge1_fmeasure": 0.18563962193300107, "rouge1_fmeasure_stderr": 0.00254964484535964, "rouge1_precision": 0.1716696703091672, "rouge1_precision_stderr": 0.0028501359020609955, "rouge1_recall": 0.25185497103999677, "rouge1_recall_stderr": 0.0034752671023028777, "rouge2_fmeasure": 0.049529716403418626, "rouge2_fmeasure_stderr": 0.001152868080944952, "rouge2_precision": 0.04455795738149438, "rouge2_precision_stderr": 0.0011159745679413468, "rouge2_recall": 0.06850978198098658, "rouge2_recall_stderr": 0.0017237693104594396, "rougeL_fmeasure": 0.13995045719718288, "rougeL_fmeasure_stderr": 0.0018763707447302035, "rougeL_precision": 0.1292734642683531, "rougeL_precision_stderr": 0.0022188669387071605, "rougeL_recall": 0.1943570396317403, "rougeL_recall_stderr": 0.0027761702028766522, "rougeLsum_fmeasure": 0.17363683324091103, "rougeLsum_fmeasure_stderr": 0.0023982582496962375, "rougeLsum_precision": 0.1610229468194331, "rougeLsum_precision_stderr": 0.002727168940548498, "rougeLsum_recall": 0.2357960382787708, "rougeLsum_recall_stderr": 0.0032789217359646683}}, "1": {"tldr_en": {"bleu": 3.0885083531376645, "bleu_stderr": 0.09894775701896347, "rouge1_fmeasure": 0.18742769556123198, "rouge1_fmeasure_stderr": 0.0024179522944743578, "rouge1_precision": 0.22141486924288373, "rouge1_precision_stderr": 0.003489092311505774, "rouge1_recall": 0.21774103131853748, "rouge1_recall_stderr": 0.003219238261544544, "rouge2_fmeasure": 0.04749462077218236, "rouge2_fmeasure_stderr": 0.0013391994596319457, "rouge2_precision": 0.05911494441028749, "rouge2_precision_stderr": 0.001977492552657427, "rouge2_recall": 0.056021987595245265, "rouge2_recall_stderr": 0.0016925719239639409, "rougeL_fmeasure": 0.14177658902154563, "rougeL_fmeasure_stderr": 0.0018452092691051947, "rougeL_precision": 0.17052813755243684, "rougeL_precision_stderr": 0.0028543436290086777, "rougeL_recall": 0.16498921391985125, "rougeL_recall_stderr": 0.0024957799702815765, "rougeLsum_fmeasure": 0.17566654570551468, "rougeLsum_fmeasure_stderr": 0.0022619479293200127, "rougeLsum_precision": 0.20843084756852662, "rougeLsum_precision_stderr": 0.003321140474934239, "rougeLsum_recall": 0.20397276049127364, "rougeLsum_recall_stderr": 0.0030133958209501476}}}, "e2e_nlg_cleaned": {"0": {"generate_text_restaurant": {"bleu": 3.8008125605460465, "bleu_stderr": 0.08334728702857473, "rouge1_fmeasure": 0.2613118947613821, "rouge1_fmeasure_stderr": 0.002127912583794242, "rouge1_precision": 0.2090865590305055, "rouge1_precision_stderr": 0.0018470177010718961, "rouge1_recall": 0.38188549726437987, "rouge1_recall_stderr": 0.003279728734456605, "rouge2_fmeasure": 0.07297635058372318, "rouge2_fmeasure_stderr": 0.001261248605220041, "rouge2_precision": 0.05673694028468428, "rouge2_precision_stderr": 0.0009833704090490367, "rouge2_recall": 0.1101409383371642, "rouge2_recall_stderr": 0.001995492794975982, "rougeL_fmeasure": 0.22836186321205557, "rougeL_fmeasure_stderr": 0.0015605125797972495, "rougeL_precision": 0.18275732889261928, "rougeL_precision_stderr": 0.0013921067012969746, "rougeL_recall": 0.3338079929800571, "rougeL_recall_stderr": 0.0024505755903694226, "rougeLsum_fmeasure": 0.21899459401932223, "rougeLsum_fmeasure_stderr": 0.002102657843438912, "rougeLsum_precision": 0.17512630400560542, "rougeLsum_precision_stderr": 0.0017783983400275266, "rougeLsum_recall": 0.32141092125405557, "rougeLsum_recall_stderr": 0.0032662985068743528}}, "1": {"generate_text_restaurant": {"bleu": 12.455563496168116, "bleu_stderr": 0.15428951986028144, "rouge1_fmeasure": 0.4844618589871223, "rouge1_fmeasure_stderr": 0.002388878380866762, "rouge1_precision": 0.5954981850070853, "rouge1_precision_stderr": 0.0032755377697093577, "rouge1_recall": 0.44832902186902923, "rouge1_recall_stderr": 0.0030688387452721486, "rouge2_fmeasure": 0.23224231794118463, "rouge2_fmeasure_stderr": 0.0020931392807158806, "rouge2_precision": 0.29040989982948295, "rouge2_precision_stderr": 0.0028204861869818784, "rouge2_recall": 0.21450317916657013, "rouge2_recall_stderr": 0.002222395267553394, "rougeL_fmeasure": 0.34990734371381305, "rougeL_fmeasure_stderr": 0.0021300316703662904, "rougeL_precision": 0.43368332329208353, "rougeL_precision_stderr": 0.003056248156608264, "rougeL_recall": 0.32270327842717356, "rougeL_recall_stderr": 0.0024894724353540653, "rougeLsum_fmeasure": 0.39499604706438096, "rougeLsum_fmeasure_stderr": 0.0023754095690034817, "rougeLsum_precision": 0.48684291022612447, "rougeLsum_precision_stderr": 0.0032370809243618716, "rougeLsum_recall": 0.3651475528395549, "rougeLsum_recall_stderr": 0.002807567486848305}}, "2": {"generate_text_restaurant": {"bleu": 15.187891510159636, "bleu_stderr": 0.2005340847158173, "rouge1_fmeasure": 0.5149400564373232, "rouge1_fmeasure_stderr": 0.002281960188799717, "rouge1_precision": 0.6089225605030864, "rouge1_precision_stderr": 0.0031749506024181815, "rouge1_recall": 0.4850253270309617, "rouge1_recall_stderr": 0.0029712295443402523, "rouge2_fmeasure": 0.26064964037026866, "rouge2_fmeasure_stderr": 0.002149918786285521, "rouge2_precision": 0.3125612676733449, "rouge2_precision_stderr": 0.002807570058211188, "rouge2_recall": 0.24520830668256238, "rouge2_recall_stderr": 0.0023166169808109976, "rougeL_fmeasure": 0.3791251783681887, "rougeL_fmeasure_stderr": 0.0021638392150190966, "rougeL_precision": 0.45032557438452553, "rougeL_precision_stderr": 0.002995769757075173, "rougeL_recall": 0.3564750276333542, "rougeL_recall_stderr": 0.002545550505071048, "rougeLsum_fmeasure": 0.4311876269636124, "rougeLsum_fmeasure_stderr": 0.0024222285980316075, "rougeLsum_precision": 0.5099476065779874, "rougeLsum_precision_stderr": 0.003210910234266457, "rougeLsum_recall": 0.40596954377109, "rougeLsum_recall_stderr": 0.002856919494329858}}, "3": {"generate_text_restaurant": {"bleu": 16.060659394975822, "bleu_stderr": 0.17284642655126536, "rouge1_fmeasure": 0.5239878618101873, "rouge1_fmeasure_stderr": 0.0022891503962730515, "rouge1_precision": 0.6148474805598093, "rouge1_precision_stderr": 0.003175147795291498, "rouge1_recall": 0.4938729679272436, "rouge1_recall_stderr": 0.0029612490025592896, "rouge2_fmeasure": 0.27038735747786175, "rouge2_fmeasure_stderr": 0.002196480015942097, "rouge2_precision": 0.32141615003361074, "rouge2_precision_stderr": 0.00284369777288176, "rouge2_recall": 0.2546854150197406, "rouge2_recall_stderr": 0.0023748524797935944, "rougeL_fmeasure": 0.3858853477225852, "rougeL_fmeasure_stderr": 0.002195201839278644, "rougeL_precision": 0.45482796385524316, "rougeL_precision_stderr": 0.0030285934039142345, "rougeL_recall": 0.3632799719766207, "rougeL_recall_stderr": 0.0025747603467030653, "rougeLsum_fmeasure": 0.44212298577697895, "rougeLsum_fmeasure_stderr": 0.0024314611034434628, "rougeLsum_precision": 0.5189202264105984, "rougeLsum_precision_stderr": 0.0032211525451001028, "rougeLsum_recall": 0.41656979202046523, "rougeLsum_recall_stderr": 0.0028606302793073527}}, "4": {"generate_text_restaurant": {"bleu": 16.35064977606228, "bleu_stderr": 0.15318703610951076, "rouge1_fmeasure": 0.5272948463681918, "rouge1_fmeasure_stderr": 0.002276632828321617, "rouge1_precision": 0.6141579219291876, "rouge1_precision_stderr": 0.0031375276423873367, "rouge1_recall": 0.49642790420160215, "rouge1_recall_stderr": 0.002890279129158977, "rouge2_fmeasure": 0.2730606307438099, "rouge2_fmeasure_stderr": 0.002234438055141524, "rouge2_precision": 0.3216796674918701, "rouge2_precision_stderr": 0.0028452669990831196, "rouge2_recall": 0.2567141692534647, "rouge2_recall_stderr": 0.002372105255220152, "rougeL_fmeasure": 0.38874867977872807, "rougeL_fmeasure_stderr": 0.0021952914125996665, "rougeL_precision": 0.45388329842280073, "rougeL_precision_stderr": 0.0029409250663779253, "rougeL_recall": 0.36571295934350256, "rougeL_recall_stderr": 0.0025294206995360793, "rougeLsum_fmeasure": 0.44624941166081916, "rougeLsum_fmeasure_stderr": 0.0024399419515776116, "rougeLsum_precision": 0.5193905306564236, "rougeLsum_precision_stderr": 0.0031731739172339655, "rougeLsum_recall": 0.4201701863764282, "rougeLsum_recall_stderr": 0.0028340856821376906}}, "5": {"generate_text_restaurant": {"bleu": 16.33989554218624, "bleu_stderr": 0.17192498787094718, "rouge1_fmeasure": 0.5272012483217712, "rouge1_fmeasure_stderr": 0.0022727033449929193, "rouge1_precision": 0.6138887802372733, "rouge1_precision_stderr": 0.003148762043973577, "rouge1_recall": 0.49579908715969256, "rouge1_recall_stderr": 0.002855704257905023, "rouge2_fmeasure": 0.2739732304449431, "rouge2_fmeasure_stderr": 0.0022083117263179994, "rouge2_precision": 0.32296239014683903, "rouge2_precision_stderr": 0.002836651143474931, "rouge2_recall": 0.25721295886814427, "rouge2_recall_stderr": 0.0023323863742251865, "rougeL_fmeasure": 0.39053942113540757, "rougeL_fmeasure_stderr": 0.0022084680095602566, "rougeL_precision": 0.4557756119232901, "rougeL_precision_stderr": 0.002957529253678058, "rougeL_recall": 0.36723275796263094, "rougeL_recall_stderr": 0.002545583277155397, "rougeLsum_fmeasure": 0.44667560043167237, "rougeLsum_fmeasure_stderr": 0.002425231007898886, "rougeLsum_precision": 0.520413988660044, "rougeLsum_precision_stderr": 0.003202124211985598, "rougeLsum_recall": 0.41985936033161986, "rougeLsum_recall_stderr": 0.002793790259009851}}}, "gem_xsum": {"0": {"article_DOC_summary": {"bleu": 1.9172897233734647, "bleu_stderr": 0.07612979258741162, "rouge1_fmeasure": 0.19497689185235167, "rouge1_fmeasure_stderr": 0.003037459759774, "rouge1_precision": 0.14704474756783373, "rouge1_precision_stderr": 0.00260243994472115, "rouge1_recall": 0.3179426585120001, "rouge1_recall_stderr": 0.005091359061361595, "rouge2_fmeasure": 0.04545175235793978, "rouge2_fmeasure_stderr": 0.0016613895167432173, "rouge2_precision": 0.033133611529725375, "rouge2_precision_stderr": 0.0012222134099385885, "rouge2_recall": 0.07643755617885226, "rouge2_recall_stderr": 0.002852925969928893, "rougeL_fmeasure": 0.14329622002037548, "rougeL_fmeasure_stderr": 0.002251083734524946, "rougeL_precision": 0.10872152825582168, "rougeL_precision_stderr": 0.0020985136406316504, "rougeL_recall": 0.23420658227277613, "rougeL_recall_stderr": 0.0038579727721169913, "rougeLsum_fmeasure": 0.15671768300152755, "rougeLsum_fmeasure_stderr": 0.0024938518539829066, "rougeLsum_precision": 0.11878580563146314, "rougeLsum_precision_stderr": 0.0022791200374934033, "rougeLsum_recall": 0.2561567987942721, "rougeLsum_recall_stderr": 0.004250537243559008}}, "1": {"article_DOC_summary": {"bleu": 2.9617243214867686, "bleu_stderr": 0.2121625238447871, "rouge1_fmeasure": 0.2429048922678839, "rouge1_fmeasure_stderr": 0.0035470294629619853, "rouge1_precision": 0.2506117820029391, "rouge1_precision_stderr": 0.004197193925421806, "rouge1_recall": 0.265051427357207, "rouge1_recall_stderr": 0.004113838412416427, "rouge2_fmeasure": 0.05697362472735911, "rouge2_fmeasure_stderr": 0.002319852424027265, "rouge2_precision": 0.059355725931601024, "rouge2_precision_stderr": 0.0026146656506255265, "rouge2_recall": 0.06240115907434781, "rouge2_recall_stderr": 0.002528707836330792, "rougeL_fmeasure": 0.1806939148235656, "rougeL_fmeasure_stderr": 0.002897868234740968, "rougeL_precision": 0.18675397233452354, "rougeL_precision_stderr": 0.003437969762757092, "rougeL_recall": 0.19744938072178414, "rougeL_recall_stderr": 0.0033460143453592026, "rougeLsum_fmeasure": 0.18340626109421165, "rougeLsum_fmeasure_stderr": 0.002921137289513508, "rougeLsum_precision": 0.18896297297256576, "rougeLsum_precision_stderr": 0.003436743475620793, "rougeLsum_recall": 0.20147068575801652, "rougeLsum_recall_stderr": 0.0034574795296360844}}, "2": {"article_DOC_summary": {"bleu": 3.790180948775114, "bleu_stderr": 0.21949698226608796, "rouge1_fmeasure": 0.2684969037756941, "rouge1_fmeasure_stderr": 0.003538515661007479, "rouge1_precision": 0.2862450933885503, "rouge1_precision_stderr": 0.0042447208222623255, "rouge1_recall": 0.2741637614630613, "rouge1_recall_stderr": 0.0038690227267741645, "rouge2_fmeasure": 0.06850101702956525, "rouge2_fmeasure_stderr": 0.002469575816155894, "rouge2_precision": 0.07370429393444561, "rouge2_precision_stderr": 0.002782856999759695, "rouge2_recall": 0.07014627514180007, "rouge2_recall_stderr": 0.002596637645417416, "rougeL_fmeasure": 0.20209449252255896, "rougeL_fmeasure_stderr": 0.003025686120342655, "rougeL_precision": 0.21544246954500543, "rougeL_precision_stderr": 0.003580176542199536, "rougeL_recall": 0.20674126511922747, "rougeL_recall_stderr": 0.0032887383484612206, "rougeLsum_fmeasure": 0.20333325134792413, "rougeLsum_fmeasure_stderr": 0.0030149542501899957, "rougeLsum_precision": 0.21658328451330233, "rougeLsum_precision_stderr": 0.003567997453456091, "rougeLsum_recall": 0.2083566653493878, "rougeLsum_recall_stderr": 0.0032948366397107273}}}} \ No newline at end of file diff --git a/8b7178b35b/evaluation/generation/slim.8b7178b35b_GEM-web_nlg_en_PALM_prompt_0.json b/8b7178b35b/evaluation/generation/slim.8b7178b35b_GEM-web_nlg_en_PALM_prompt_0.json new file mode 100644 index 0000000000000000000000000000000000000000..e3062ffb9cc12386a201fcd4eb8f9c5f1a94d33e --- /dev/null +++ b/8b7178b35b/evaluation/generation/slim.8b7178b35b_GEM-web_nlg_en_PALM_prompt_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.347289354458488, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.03777797007924809 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.079226368742227, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0023231969845277887 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.28110828630725015, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.004882004381200993 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.10890954353426278, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.002110258935484955 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.03743726607123581, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.001494228694268955 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.13690374884005102, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.003169133187878269 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.05172430149730381, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0013180585408877222 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.07666350308702279, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0022367957170880146 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.2745019482026448, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004789753920178336 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.10554978776184795, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0020007799763877027 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.07592638133051025, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.002251359653603086 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.2686557447211624, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004613052990575398 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.10411236694388043, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0019983020211639833 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b35b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b35b/evaluation/generation/slim.8b7178b35b_GEM-web_nlg_en_PALM_prompt_1.json b/8b7178b35b/evaluation/generation/slim.8b7178b35b_GEM-web_nlg_en_PALM_prompt_1.json new file mode 100644 index 0000000000000000000000000000000000000000..94a799cf02f0f06b9bd216a14afba2425e25bfbe --- /dev/null +++ b/8b7178b35b/evaluation/generation/slim.8b7178b35b_GEM-web_nlg_en_PALM_prompt_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.5749625372797772, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.042168587225678913 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.1384507797063748, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.004372707845611215 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.322644364844527, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.004855940304467451 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.1639618887300654, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.003768473720694237 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.0725164426950792, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0030197107273513208 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.16687390506721525, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0035088962671374286 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.0838728953683248, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.002551976059024005 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.12455299793053924, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0037936801945088155 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.3050028170207448, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004518320595879189 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.14973459838273895, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.003227143648327153 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.1263163648899627, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0038597130269363692 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.3062159795615415, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004522396040564721 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.15125353657464896, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0032779530465988412 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b35b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b35b/evaluation/generation/slim.8b7178b35b_GEM-web_nlg_en_PALM_prompt_2.json b/8b7178b35b/evaluation/generation/slim.8b7178b35b_GEM-web_nlg_en_PALM_prompt_2.json new file mode 100644 index 0000000000000000000000000000000000000000..8b6881f05203d09c75263824c7e45ae406d7fb50 --- /dev/null +++ b/8b7178b35b/evaluation/generation/slim.8b7178b35b_GEM-web_nlg_en_PALM_prompt_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.6896289267842831, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.04363432869368013 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.1736763143186271, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.005190144069158226 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.3690495199973296, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.004674550419980399 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.19577491362940544, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.004183820712066921 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.09630923485520457, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.003591484421705004 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.19774238776363945, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0036773455774089777 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.10468204406915697, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.002958633901985044 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.15346964126360133, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.004394358403285555 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.34605615384304983, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0043553659806620975 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.17655301985743188, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.003543990303517691 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.15737438288230765, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.004551780258151066 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.34891501370883077, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004358767783710016 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.17970682314011696, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.003629660902642662 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b35b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b35b/evaluation/generation/slim.8b7178b35b_GEM-web_nlg_en_PALM_prompt_3.json b/8b7178b35b/evaluation/generation/slim.8b7178b35b_GEM-web_nlg_en_PALM_prompt_3.json new file mode 100644 index 0000000000000000000000000000000000000000..3b7fe009d3f0481934800fc8cbebac60b98ee7c1 --- /dev/null +++ b/8b7178b35b/evaluation/generation/slim.8b7178b35b_GEM-web_nlg_en_PALM_prompt_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.7168649256709774, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.04675221435801664 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.1766984056786614, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0052889863501627 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.3784023798729607, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.004834949146967397 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.20039314889286589, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.00433393844787534 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.09764044765164406, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0036619448797318528 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.2030335209107597, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.003804312974743258 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.10711581894262515, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.00302754276771825 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.15566438191020568, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.004489975630701125 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.3537310697482285, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004433439714918285 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.18005823477527308, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.003625480259314596 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.1606361822943105, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.004693428623221418 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.3571516509838202, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004469628307077723 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.18404319632429025, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0037645994118713916 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b35b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b35b/evaluation/generation/slim.8b7178b35b_GEM-web_nlg_en_PALM_prompt_4.json b/8b7178b35b/evaluation/generation/slim.8b7178b35b_GEM-web_nlg_en_PALM_prompt_4.json new file mode 100644 index 0000000000000000000000000000000000000000..22ead1a274946004d2e26a69b7409b5a7bb55ad2 --- /dev/null +++ b/8b7178b35b/evaluation/generation/slim.8b7178b35b_GEM-web_nlg_en_PALM_prompt_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.8264767377736691, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.053779296385247366 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.1812068418232479, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.005398716331751978 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.38369035451056227, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.00470013713630282 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.20221675887809062, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.004283401665288551 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.1006261222318028, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0036927051039995647 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.2074416749104224, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0036680698832641224 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.10880911597097326, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0029539167777379253 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.15862122681407606, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.004530792062039435 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.35743845572365024, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004293662429385583 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.18068778740178215, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0035531966464061853 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.16438209047726673, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.004775185780341334 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.3611996661245711, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.00431294873519373 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.185234182101754, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.00371289144584664 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b35b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b35b/evaluation/generation/slim.8b7178b35b_GEM-web_nlg_en_PALM_prompt_5.json b/8b7178b35b/evaluation/generation/slim.8b7178b35b_GEM-web_nlg_en_PALM_prompt_5.json new file mode 100644 index 0000000000000000000000000000000000000000..1308933e071574a004c4b8ee0208581ec405ab69 --- /dev/null +++ b/8b7178b35b/evaluation/generation/slim.8b7178b35b_GEM-web_nlg_en_PALM_prompt_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.8765489182001927, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.040019456401903304 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.1926905497088421, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0057538188799125855 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.3858328625547419, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.004823164304577201 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.20880684983729342, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.004530179904806841 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.11101027585585174, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.004140682260724748 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.21158156307350992, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.003943074328986311 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.11565656452634464, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.003314764756228703 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.16975713372550302, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0049633182199218225 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.3591348058816613, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004445791053730718 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.18694354311801048, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0038293768377802495 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.17553725023286618, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.005177574879953629 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.36311828129199303, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0044570305199087895 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.1915290665625795, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.00396816747113494 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b35b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b35b/evaluation/generation/slim.8b7178b35b_GEM-wiki_lingua_en_tldr_en_0.json b/8b7178b35b/evaluation/generation/slim.8b7178b35b_GEM-wiki_lingua_en_tldr_en_0.json new file mode 100644 index 0000000000000000000000000000000000000000..e35e8e4703e139b2a74020b89a3f59a74365dfb9 --- /dev/null +++ b/8b7178b35b/evaluation/generation/slim.8b7178b35b_GEM-wiki_lingua_en_tldr_en_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.1716696703091672, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0028501359020609955 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.25185497103999677, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0034752671023028777 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.18563962193300107, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.00254964484535964 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.04455795738149438, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0011159745679413468 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.06850978198098658, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0017237693104594396 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.049529716403418626, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.001152868080944952 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.1292734642683531, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0022188669387071605 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.1943570396317403, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0027761702028766522 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.13995045719718288, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0018763707447302035 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.1610229468194331, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.002727168940548498 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.2357960382787708, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0032789217359646683 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.17363683324091103, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0023982582496962375 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 3.586033759423314, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.09221854298529836 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b35b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b35b/evaluation/generation/slim.8b7178b35b_GEM-wiki_lingua_en_tldr_en_1.json b/8b7178b35b/evaluation/generation/slim.8b7178b35b_GEM-wiki_lingua_en_tldr_en_1.json new file mode 100644 index 0000000000000000000000000000000000000000..662f45e139b0ba3c511570fe54aea6eafa3c7873 --- /dev/null +++ b/8b7178b35b/evaluation/generation/slim.8b7178b35b_GEM-wiki_lingua_en_tldr_en_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.22141486924288373, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.003489092311505774 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.21774103131853748, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.003219238261544544 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.18742769556123198, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0024179522944743578 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.05911494441028749, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.001977492552657427 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.056021987595245265, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0016925719239639409 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.04749462077218236, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0013391994596319457 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.17052813755243684, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0028543436290086777 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.16498921391985125, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0024957799702815765 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.14177658902154563, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0018452092691051947 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.20843084756852662, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.003321140474934239 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.20397276049127364, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0030133958209501476 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.17566654570551468, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0022619479293200127 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 3.0885083531376645, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.09894775701896347 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b35b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b35b/evaluation/generation/slim.8b7178b35b_e2e_nlg_cleaned_generate_text_restaurant_0.json b/8b7178b35b/evaluation/generation/slim.8b7178b35b_e2e_nlg_cleaned_generate_text_restaurant_0.json new file mode 100644 index 0000000000000000000000000000000000000000..2d515de6a4d036e955525c60850d1e6a1be78514 --- /dev/null +++ b/8b7178b35b/evaluation/generation/slim.8b7178b35b_e2e_nlg_cleaned_generate_text_restaurant_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 3.8008125605460465, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.08334728702857473 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.2090865590305055, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0018470177010718961 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.38188549726437987, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.003279728734456605 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.2613118947613821, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.002127912583794242 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.05673694028468428, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0009833704090490367 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.1101409383371642, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.001995492794975982 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.07297635058372318, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.001261248605220041 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.18275732889261928, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0013921067012969746 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.3338079929800571, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0024505755903694226 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.22836186321205557, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0015605125797972495 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.17512630400560542, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0017783983400275266 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.32141092125405557, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0032662985068743528 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.21899459401932223, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.002102657843438912 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b35b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b35b/evaluation/generation/slim.8b7178b35b_e2e_nlg_cleaned_generate_text_restaurant_1.json b/8b7178b35b/evaluation/generation/slim.8b7178b35b_e2e_nlg_cleaned_generate_text_restaurant_1.json new file mode 100644 index 0000000000000000000000000000000000000000..856dcdefaff0ab8d98dc7fd82b67ba523b375e0c --- /dev/null +++ b/8b7178b35b/evaluation/generation/slim.8b7178b35b_e2e_nlg_cleaned_generate_text_restaurant_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 12.455563496168116, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.15428951986028144 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.5954981850070853, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0032755377697093577 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.44832902186902923, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0030688387452721486 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.4844618589871223, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.002388878380866762 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.29040989982948295, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0028204861869818784 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.21450317916657013, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.002222395267553394 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.23224231794118463, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0020931392807158806 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.43368332329208353, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.003056248156608264 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.32270327842717356, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0024894724353540653 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.34990734371381305, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0021300316703662904 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.48684291022612447, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0032370809243618716 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.3651475528395549, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.002807567486848305 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.39499604706438096, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0023754095690034817 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b35b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b35b/evaluation/generation/slim.8b7178b35b_e2e_nlg_cleaned_generate_text_restaurant_2.json b/8b7178b35b/evaluation/generation/slim.8b7178b35b_e2e_nlg_cleaned_generate_text_restaurant_2.json new file mode 100644 index 0000000000000000000000000000000000000000..49c87014d4ebcd9ffcad95855af6ea9632bfca93 --- /dev/null +++ b/8b7178b35b/evaluation/generation/slim.8b7178b35b_e2e_nlg_cleaned_generate_text_restaurant_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 15.187891510159636, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.2005340847158173 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.6089225605030864, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0031749506024181815 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.4850253270309617, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0029712295443402523 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.5149400564373232, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.002281960188799717 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.3125612676733449, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.002807570058211188 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.24520830668256238, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0023166169808109976 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.26064964037026866, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.002149918786285521 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.45032557438452553, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.002995769757075173 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.3564750276333542, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.002545550505071048 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.3791251783681887, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0021638392150190966 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.5099476065779874, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.003210910234266457 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.40596954377109, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.002856919494329858 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.4311876269636124, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0024222285980316075 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b35b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b35b/evaluation/generation/slim.8b7178b35b_e2e_nlg_cleaned_generate_text_restaurant_3.json b/8b7178b35b/evaluation/generation/slim.8b7178b35b_e2e_nlg_cleaned_generate_text_restaurant_3.json new file mode 100644 index 0000000000000000000000000000000000000000..4ae15e4e8484fa81f86e62b7d2b3a33421150280 --- /dev/null +++ b/8b7178b35b/evaluation/generation/slim.8b7178b35b_e2e_nlg_cleaned_generate_text_restaurant_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 16.060659394975822, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.17284642655126536 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.6148474805598093, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.003175147795291498 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.4938729679272436, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0029612490025592896 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.5239878618101873, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0022891503962730515 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.32141615003361074, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.00284369777288176 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.2546854150197406, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0023748524797935944 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.27038735747786175, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.002196480015942097 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.45482796385524316, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0030285934039142345 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.3632799719766207, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0025747603467030653 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.3858853477225852, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.002195201839278644 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.5189202264105984, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0032211525451001028 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.41656979202046523, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0028606302793073527 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.44212298577697895, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0024314611034434628 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b35b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b35b/evaluation/generation/slim.8b7178b35b_e2e_nlg_cleaned_generate_text_restaurant_4.json b/8b7178b35b/evaluation/generation/slim.8b7178b35b_e2e_nlg_cleaned_generate_text_restaurant_4.json new file mode 100644 index 0000000000000000000000000000000000000000..74ffbb6b627639900ca592492a5a3af8a49339c4 --- /dev/null +++ b/8b7178b35b/evaluation/generation/slim.8b7178b35b_e2e_nlg_cleaned_generate_text_restaurant_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 16.35064977606228, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.15318703610951076 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.6141579219291876, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0031375276423873367 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.49642790420160215, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.002890279129158977 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.5272948463681918, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.002276632828321617 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.3216796674918701, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0028452669990831196 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.2567141692534647, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.002372105255220152 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.2730606307438099, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.002234438055141524 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.45388329842280073, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0029409250663779253 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.36571295934350256, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0025294206995360793 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.38874867977872807, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0021952914125996665 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.5193905306564236, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0031731739172339655 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.4201701863764282, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0028340856821376906 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.44624941166081916, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0024399419515776116 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b35b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b35b/evaluation/generation/slim.8b7178b35b_e2e_nlg_cleaned_generate_text_restaurant_5.json b/8b7178b35b/evaluation/generation/slim.8b7178b35b_e2e_nlg_cleaned_generate_text_restaurant_5.json new file mode 100644 index 0000000000000000000000000000000000000000..a6085e8ed58573a5e5d9ce604b8a38304b48b565 --- /dev/null +++ b/8b7178b35b/evaluation/generation/slim.8b7178b35b_e2e_nlg_cleaned_generate_text_restaurant_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 16.33989554218624, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.17192498787094718 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.6138887802372733, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.003148762043973577 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.49579908715969256, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.002855704257905023 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.5272012483217712, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0022727033449929193 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.32296239014683903, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.002836651143474931 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.25721295886814427, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0023323863742251865 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.2739732304449431, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0022083117263179994 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.4557756119232901, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.002957529253678058 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.36723275796263094, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.002545583277155397 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.39053942113540757, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0022084680095602566 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.520413988660044, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.003202124211985598 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.41985936033161986, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.002793790259009851 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.44667560043167237, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.002425231007898886 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b35b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b35b/evaluation/generation/slim.8b7178b35b_gem_xsum_article_DOC_summary_0.json b/8b7178b35b/evaluation/generation/slim.8b7178b35b_gem_xsum_article_DOC_summary_0.json new file mode 100644 index 0000000000000000000000000000000000000000..cb17edd68e0545c805f4a13c91116b98368ff7dc --- /dev/null +++ b/8b7178b35b/evaluation/generation/slim.8b7178b35b_gem_xsum_article_DOC_summary_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.14704474756783373, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.00260243994472115 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.3179426585120001, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.005091359061361595 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.19497689185235167, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.003037459759774 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.033133611529725375, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0012222134099385885 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.07643755617885226, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.002852925969928893 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.04545175235793978, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0016613895167432173 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.10872152825582168, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0020985136406316504 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.23420658227277613, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0038579727721169913 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.14329622002037548, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.002251083734524946 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.11878580563146314, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0022791200374934033 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.2561567987942721, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.004250537243559008 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.15671768300152755, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0024938518539829066 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 1.9172897233734647, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.07612979258741162 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b35b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b35b/evaluation/generation/slim.8b7178b35b_gem_xsum_article_DOC_summary_1.json b/8b7178b35b/evaluation/generation/slim.8b7178b35b_gem_xsum_article_DOC_summary_1.json new file mode 100644 index 0000000000000000000000000000000000000000..cbc327ecef30fc8a09f2bf96b93e1851e32db9da --- /dev/null +++ b/8b7178b35b/evaluation/generation/slim.8b7178b35b_gem_xsum_article_DOC_summary_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.2506117820029391, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.004197193925421806 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.265051427357207, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.004113838412416427 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.2429048922678839, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0035470294629619853 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.059355725931601024, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0026146656506255265 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.06240115907434781, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.002528707836330792 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.05697362472735911, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.002319852424027265 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.18675397233452354, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.003437969762757092 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.19744938072178414, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0033460143453592026 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.1806939148235656, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.002897868234740968 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.18896297297256576, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.003436743475620793 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.20147068575801652, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0034574795296360844 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.18340626109421165, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.002921137289513508 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 2.9617243214867686, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.2121625238447871 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b35b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b35b/evaluation/generation/slim.8b7178b35b_gem_xsum_article_DOC_summary_2.json b/8b7178b35b/evaluation/generation/slim.8b7178b35b_gem_xsum_article_DOC_summary_2.json new file mode 100644 index 0000000000000000000000000000000000000000..ec6df40155c6d08e84eb8152ef0dd8627832a155 --- /dev/null +++ b/8b7178b35b/evaluation/generation/slim.8b7178b35b_gem_xsum_article_DOC_summary_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.2862450933885503, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0042447208222623255 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.2741637614630613, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.0038690227267741645 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.2684969037756941, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.003538515661007479 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.07370429393444561, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.002782856999759695 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.07014627514180007, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.002596637645417416 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.06850101702956525, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.002469575816155894 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.21544246954500543, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.003580176542199536 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.20674126511922747, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0032887383484612206 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.20209449252255896, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.003025686120342655 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.21658328451330233, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.003567997453456091 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.2083566653493878, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0032948366397107273 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.20333325134792413, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0030149542501899957 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 3.790180948775114, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.21949698226608796 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b35b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b35b/evaluation/generation/slim.global_step84877_GEM-web_nlg_en_PALM_prompt_0.json b/8b7178b35b/evaluation/generation/slim.global_step84877_GEM-web_nlg_en_PALM_prompt_0.json new file mode 100644 index 0000000000000000000000000000000000000000..bd4847ce5234b42b419e23fd2699c180bcaff40f --- /dev/null +++ b/8b7178b35b/evaluation/generation/slim.global_step84877_GEM-web_nlg_en_PALM_prompt_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.347289354458488, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.03777797007924809 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.079226368742227, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0023231969845277887 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.28110828630725015, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.004882004381200993 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.10890954353426278, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.002110258935484955 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.03743726607123581, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.001494228694268955 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.13690374884005102, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.003169133187878269 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.05172430149730381, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0013180585408877222 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.07666350308702279, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0022367957170880146 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.2745019482026448, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004789753920178336 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.10554978776184795, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0020007799763877027 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.07592638133051025, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.002251359653603086 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.2686557447211624, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004613052990575398 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.10411236694388043, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0019983020211639833 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b35b/global_step84877/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b35b/evaluation/generation/slim.global_step84877_GEM-web_nlg_en_PALM_prompt_1.json b/8b7178b35b/evaluation/generation/slim.global_step84877_GEM-web_nlg_en_PALM_prompt_1.json new file mode 100644 index 0000000000000000000000000000000000000000..8853212e88257835c923a9d78169f9b5d591a507 --- /dev/null +++ b/8b7178b35b/evaluation/generation/slim.global_step84877_GEM-web_nlg_en_PALM_prompt_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.5749625372797772, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.042168587225678913 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.1384507797063748, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.004372707845611215 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.322644364844527, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.004855940304467451 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.1639618887300654, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.003768473720694237 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.0725164426950792, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0030197107273513208 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.16687390506721525, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0035088962671374286 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.0838728953683248, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.002551976059024005 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.12455299793053924, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0037936801945088155 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.3050028170207448, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004518320595879189 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.14973459838273895, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.003227143648327153 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.1263163648899627, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0038597130269363692 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.3062159795615415, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004522396040564721 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.15125353657464896, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0032779530465988412 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b35b/global_step84877/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b35b/evaluation/generation/slim.global_step84877_GEM-web_nlg_en_PALM_prompt_2.json b/8b7178b35b/evaluation/generation/slim.global_step84877_GEM-web_nlg_en_PALM_prompt_2.json new file mode 100644 index 0000000000000000000000000000000000000000..602209bcaa279b023c1ffc9f2511d79f335308ec --- /dev/null +++ b/8b7178b35b/evaluation/generation/slim.global_step84877_GEM-web_nlg_en_PALM_prompt_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.6896289267842831, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.04363432869368013 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.1736763143186271, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.005190144069158226 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.3690495199973296, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.004674550419980399 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.19577491362940544, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.004183820712066921 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.09630923485520457, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.003591484421705004 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.19774238776363945, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0036773455774089777 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.10468204406915697, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.002958633901985044 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.15346964126360133, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.004394358403285555 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.34605615384304983, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0043553659806620975 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.17655301985743188, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.003543990303517691 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.15737438288230765, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.004551780258151066 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.34891501370883077, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004358767783710016 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.17970682314011696, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.003629660902642662 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b35b/global_step84877/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b35b/evaluation/generation/slim.global_step84877_GEM-web_nlg_en_PALM_prompt_3.json b/8b7178b35b/evaluation/generation/slim.global_step84877_GEM-web_nlg_en_PALM_prompt_3.json new file mode 100644 index 0000000000000000000000000000000000000000..4f2088a915c4ed7f599a538db78365a222c73977 --- /dev/null +++ b/8b7178b35b/evaluation/generation/slim.global_step84877_GEM-web_nlg_en_PALM_prompt_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.7168649256709774, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.04675221435801664 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.1766984056786614, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0052889863501627 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.3784023798729607, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.004834949146967397 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.20039314889286589, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.00433393844787534 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.09764044765164406, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0036619448797318528 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.2030335209107597, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.003804312974743258 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.10711581894262515, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.00302754276771825 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.15566438191020568, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.004489975630701125 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.3537310697482285, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004433439714918285 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.18005823477527308, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.003625480259314596 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.1606361822943105, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.004693428623221418 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.3571516509838202, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004469628307077723 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.18404319632429025, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0037645994118713916 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b35b/global_step84877/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b35b/evaluation/generation/slim.global_step84877_GEM-web_nlg_en_PALM_prompt_4.json b/8b7178b35b/evaluation/generation/slim.global_step84877_GEM-web_nlg_en_PALM_prompt_4.json new file mode 100644 index 0000000000000000000000000000000000000000..e0b8b004eb5194994c49f42c104b4345ce08b88c --- /dev/null +++ b/8b7178b35b/evaluation/generation/slim.global_step84877_GEM-web_nlg_en_PALM_prompt_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.8264767377736691, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.053779296385247366 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.1812068418232479, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.005398716331751978 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.38369035451056227, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.00470013713630282 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.20221675887809062, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.004283401665288551 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.1006261222318028, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0036927051039995647 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.2074416749104224, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0036680698832641224 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.10880911597097326, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0029539167777379253 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.15862122681407606, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.004530792062039435 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.35743845572365024, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004293662429385583 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.18068778740178215, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0035531966464061853 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.16438209047726673, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.004775185780341334 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.3611996661245711, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.00431294873519373 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.185234182101754, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.00371289144584664 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b35b/global_step84877/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b35b/evaluation/generation/slim.global_step84877_GEM-web_nlg_en_PALM_prompt_5.json b/8b7178b35b/evaluation/generation/slim.global_step84877_GEM-web_nlg_en_PALM_prompt_5.json new file mode 100644 index 0000000000000000000000000000000000000000..224c3cd80d46efee78fba22c712912bfa6e3cbc6 --- /dev/null +++ b/8b7178b35b/evaluation/generation/slim.global_step84877_GEM-web_nlg_en_PALM_prompt_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.8765489182001927, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.040019456401903304 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.1926905497088421, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0057538188799125855 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.3858328625547419, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.004823164304577201 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.20880684983729342, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.004530179904806841 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.11101027585585174, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.004140682260724748 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.21158156307350992, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.003943074328986311 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.11565656452634464, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.003314764756228703 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.16975713372550302, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0049633182199218225 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.3591348058816613, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004445791053730718 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.18694354311801048, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0038293768377802495 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.17553725023286618, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.005177574879953629 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.36311828129199303, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0044570305199087895 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.1915290665625795, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.00396816747113494 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b35b/global_step84877/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b35b/evaluation/generation/slim.global_step84877_GEM-wiki_lingua_en_tldr_en_0.json b/8b7178b35b/evaluation/generation/slim.global_step84877_GEM-wiki_lingua_en_tldr_en_0.json new file mode 100644 index 0000000000000000000000000000000000000000..154c9f3e537008fb4b3f44517ce2d1633ddf7830 --- /dev/null +++ b/8b7178b35b/evaluation/generation/slim.global_step84877_GEM-wiki_lingua_en_tldr_en_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.1716696703091672, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0028501359020609955 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.25185497103999677, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0034752671023028777 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.18563962193300107, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.00254964484535964 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.04455795738149438, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0011159745679413468 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.06850978198098658, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0017237693104594396 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.049529716403418626, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.001152868080944952 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.1292734642683531, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0022188669387071605 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.1943570396317403, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0027761702028766522 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.13995045719718288, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0018763707447302035 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.1610229468194331, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.002727168940548498 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.2357960382787708, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0032789217359646683 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.17363683324091103, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0023982582496962375 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 3.586033759423314, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.09221854298529836 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b35b/global_step84877/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b35b/evaluation/generation/slim.global_step84877_GEM-wiki_lingua_en_tldr_en_1.json b/8b7178b35b/evaluation/generation/slim.global_step84877_GEM-wiki_lingua_en_tldr_en_1.json new file mode 100644 index 0000000000000000000000000000000000000000..b1f63ef762c7e2c3315399c0b2f020f650c20f3a --- /dev/null +++ b/8b7178b35b/evaluation/generation/slim.global_step84877_GEM-wiki_lingua_en_tldr_en_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.22141486924288373, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.003489092311505774 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.21774103131853748, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.003219238261544544 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.18742769556123198, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0024179522944743578 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.05911494441028749, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.001977492552657427 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.056021987595245265, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0016925719239639409 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.04749462077218236, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0013391994596319457 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.17052813755243684, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0028543436290086777 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.16498921391985125, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0024957799702815765 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.14177658902154563, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0018452092691051947 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.20843084756852662, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.003321140474934239 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.20397276049127364, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0030133958209501476 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.17566654570551468, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0022619479293200127 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 3.0885083531376645, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.09894775701896347 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b35b/global_step84877/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b35b/evaluation/generation/slim.global_step84877_e2e_nlg_cleaned_generate_text_restaurant_0.json b/8b7178b35b/evaluation/generation/slim.global_step84877_e2e_nlg_cleaned_generate_text_restaurant_0.json new file mode 100644 index 0000000000000000000000000000000000000000..72169604e6f39b2b1a84a743894b80641c7131ae --- /dev/null +++ b/8b7178b35b/evaluation/generation/slim.global_step84877_e2e_nlg_cleaned_generate_text_restaurant_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 3.8008125605460465, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.08334728702857473 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.2090865590305055, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0018470177010718961 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.38188549726437987, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.003279728734456605 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.2613118947613821, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.002127912583794242 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.05673694028468428, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0009833704090490367 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.1101409383371642, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.001995492794975982 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.07297635058372318, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.001261248605220041 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.18275732889261928, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0013921067012969746 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.3338079929800571, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0024505755903694226 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.22836186321205557, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0015605125797972495 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.17512630400560542, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0017783983400275266 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.32141092125405557, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0032662985068743528 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.21899459401932223, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.002102657843438912 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b35b/global_step84877/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b35b/evaluation/generation/slim.global_step84877_e2e_nlg_cleaned_generate_text_restaurant_1.json b/8b7178b35b/evaluation/generation/slim.global_step84877_e2e_nlg_cleaned_generate_text_restaurant_1.json new file mode 100644 index 0000000000000000000000000000000000000000..184246bf3a6bf7abb0910d7a9b4b50714076e359 --- /dev/null +++ b/8b7178b35b/evaluation/generation/slim.global_step84877_e2e_nlg_cleaned_generate_text_restaurant_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 12.455563496168116, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.15428951986028144 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.5954981850070853, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0032755377697093577 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.44832902186902923, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0030688387452721486 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.4844618589871223, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.002388878380866762 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.29040989982948295, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0028204861869818784 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.21450317916657013, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.002222395267553394 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.23224231794118463, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0020931392807158806 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.43368332329208353, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.003056248156608264 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.32270327842717356, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0024894724353540653 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.34990734371381305, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0021300316703662904 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.48684291022612447, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0032370809243618716 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.3651475528395549, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.002807567486848305 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.39499604706438096, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0023754095690034817 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b35b/global_step84877/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b35b/evaluation/generation/slim.global_step84877_e2e_nlg_cleaned_generate_text_restaurant_2.json b/8b7178b35b/evaluation/generation/slim.global_step84877_e2e_nlg_cleaned_generate_text_restaurant_2.json new file mode 100644 index 0000000000000000000000000000000000000000..01ee620a38481bef48158431e3dd0018f8bf3103 --- /dev/null +++ b/8b7178b35b/evaluation/generation/slim.global_step84877_e2e_nlg_cleaned_generate_text_restaurant_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 15.187891510159636, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.2005340847158173 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.6089225605030864, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0031749506024181815 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.4850253270309617, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0029712295443402523 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.5149400564373232, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.002281960188799717 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.3125612676733449, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.002807570058211188 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.24520830668256238, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0023166169808109976 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.26064964037026866, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.002149918786285521 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.45032557438452553, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.002995769757075173 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.3564750276333542, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.002545550505071048 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.3791251783681887, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0021638392150190966 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.5099476065779874, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.003210910234266457 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.40596954377109, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.002856919494329858 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.4311876269636124, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0024222285980316075 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b35b/global_step84877/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b35b/evaluation/generation/slim.global_step84877_e2e_nlg_cleaned_generate_text_restaurant_3.json b/8b7178b35b/evaluation/generation/slim.global_step84877_e2e_nlg_cleaned_generate_text_restaurant_3.json new file mode 100644 index 0000000000000000000000000000000000000000..a0f64709fb6392b6d693cbff1703b550327a28ce --- /dev/null +++ b/8b7178b35b/evaluation/generation/slim.global_step84877_e2e_nlg_cleaned_generate_text_restaurant_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 16.060659394975822, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.17284642655126536 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.6148474805598093, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.003175147795291498 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.4938729679272436, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0029612490025592896 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.5239878618101873, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0022891503962730515 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.32141615003361074, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.00284369777288176 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.2546854150197406, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0023748524797935944 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.27038735747786175, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.002196480015942097 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.45482796385524316, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0030285934039142345 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.3632799719766207, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0025747603467030653 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.3858853477225852, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.002195201839278644 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.5189202264105984, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0032211525451001028 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.41656979202046523, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0028606302793073527 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.44212298577697895, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0024314611034434628 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b35b/global_step84877/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b35b/evaluation/generation/slim.global_step84877_e2e_nlg_cleaned_generate_text_restaurant_4.json b/8b7178b35b/evaluation/generation/slim.global_step84877_e2e_nlg_cleaned_generate_text_restaurant_4.json new file mode 100644 index 0000000000000000000000000000000000000000..cd91e80c33fdf769dc32714331bd7331bcb90527 --- /dev/null +++ b/8b7178b35b/evaluation/generation/slim.global_step84877_e2e_nlg_cleaned_generate_text_restaurant_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 16.35064977606228, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.15318703610951076 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.6141579219291876, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0031375276423873367 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.49642790420160215, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.002890279129158977 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.5272948463681918, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.002276632828321617 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.3216796674918701, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0028452669990831196 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.2567141692534647, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.002372105255220152 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.2730606307438099, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.002234438055141524 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.45388329842280073, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0029409250663779253 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.36571295934350256, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0025294206995360793 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.38874867977872807, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0021952914125996665 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.5193905306564236, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0031731739172339655 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.4201701863764282, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0028340856821376906 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.44624941166081916, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0024399419515776116 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b35b/global_step84877/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b35b/evaluation/generation/slim.global_step84877_e2e_nlg_cleaned_generate_text_restaurant_5.json b/8b7178b35b/evaluation/generation/slim.global_step84877_e2e_nlg_cleaned_generate_text_restaurant_5.json new file mode 100644 index 0000000000000000000000000000000000000000..69240cf9348a54761340bce8e0eeec8d971143ed --- /dev/null +++ b/8b7178b35b/evaluation/generation/slim.global_step84877_e2e_nlg_cleaned_generate_text_restaurant_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 16.33989554218624, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.17192498787094718 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.6138887802372733, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.003148762043973577 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.49579908715969256, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.002855704257905023 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.5272012483217712, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0022727033449929193 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.32296239014683903, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.002836651143474931 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.25721295886814427, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0023323863742251865 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.2739732304449431, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0022083117263179994 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.4557756119232901, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.002957529253678058 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.36723275796263094, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.002545583277155397 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.39053942113540757, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0022084680095602566 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.520413988660044, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.003202124211985598 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.41985936033161986, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.002793790259009851 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.44667560043167237, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.002425231007898886 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b35b/global_step84877/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b35b/evaluation/generation/slim.global_step84877_gem_xsum_article_DOC_summary_0.json b/8b7178b35b/evaluation/generation/slim.global_step84877_gem_xsum_article_DOC_summary_0.json new file mode 100644 index 0000000000000000000000000000000000000000..63e28828b7d53c1d5000450b494c0e2fcf1a9922 --- /dev/null +++ b/8b7178b35b/evaluation/generation/slim.global_step84877_gem_xsum_article_DOC_summary_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.14704474756783373, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.00260243994472115 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.3179426585120001, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.005091359061361595 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.19497689185235167, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.003037459759774 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.033133611529725375, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0012222134099385885 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.07643755617885226, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.002852925969928893 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.04545175235793978, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0016613895167432173 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.10872152825582168, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0020985136406316504 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.23420658227277613, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0038579727721169913 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.14329622002037548, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.002251083734524946 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.11878580563146314, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0022791200374934033 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.2561567987942721, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.004250537243559008 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.15671768300152755, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0024938518539829066 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 1.9172897233734647, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.07612979258741162 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b35b/global_step84877/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b35b/evaluation/generation/slim.global_step84877_gem_xsum_article_DOC_summary_1.json b/8b7178b35b/evaluation/generation/slim.global_step84877_gem_xsum_article_DOC_summary_1.json new file mode 100644 index 0000000000000000000000000000000000000000..bdb534bfdbfe0605106ba9995e3153737b39184a --- /dev/null +++ b/8b7178b35b/evaluation/generation/slim.global_step84877_gem_xsum_article_DOC_summary_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.2506117820029391, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.004197193925421806 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.265051427357207, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.004113838412416427 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.2429048922678839, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0035470294629619853 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.059355725931601024, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0026146656506255265 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.06240115907434781, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.002528707836330792 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.05697362472735911, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.002319852424027265 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.18675397233452354, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.003437969762757092 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.19744938072178414, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0033460143453592026 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.1806939148235656, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.002897868234740968 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.18896297297256576, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.003436743475620793 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.20147068575801652, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0034574795296360844 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.18340626109421165, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.002921137289513508 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 2.9617243214867686, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.2121625238447871 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b35b/global_step84877/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b35b/evaluation/generation/slim.global_step84877_gem_xsum_article_DOC_summary_2.json b/8b7178b35b/evaluation/generation/slim.global_step84877_gem_xsum_article_DOC_summary_2.json new file mode 100644 index 0000000000000000000000000000000000000000..ebe628daa445f1c780452d63643ad4af1af65492 --- /dev/null +++ b/8b7178b35b/evaluation/generation/slim.global_step84877_gem_xsum_article_DOC_summary_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.2862450933885503, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0042447208222623255 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.2741637614630613, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.0038690227267741645 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.2684969037756941, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.003538515661007479 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.07370429393444561, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.002782856999759695 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.07014627514180007, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.002596637645417416 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.06850101702956525, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.002469575816155894 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.21544246954500543, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.003580176542199536 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.20674126511922747, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0032887383484612206 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.20209449252255896, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.003025686120342655 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.21658328451330233, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.003567997453456091 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.2083566653493878, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0032948366397107273 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.20333325134792413, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0030149542501899957 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 3.790180948775114, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.21949698226608796 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b35b/global_step84877/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b35b/evaluation/rankeval/8b7178b35b_0.csv b/8b7178b35b/evaluation/rankeval/8b7178b35b_0.csv new file mode 100644 index 0000000000000000000000000000000000000000..ea2af22dc377b4a9ed40df8dcb9fd5b62aacee49 --- /dev/null +++ b/8b7178b35b/evaluation/rankeval/8b7178b35b_0.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.335,0.014933117490932575,0 +anli_r2,acc,0.337,0.014955087918653605,0 +anli_r3,acc,0.33916666666666667,0.013672343491681819,0 +arc_challenge,acc,0.2738907849829352,0.013032004972989501,0 +arc_challenge,acc_norm,0.2935153583617747,0.013307250444941117,0 +arc_easy,acc,0.6069023569023569,0.010022540618945312,0 +arc_easy,acc_norm,0.5526094276094277,0.01020283238541565,0 +boolq,acc,0.5642201834862385,0.00867262173201595,1 +cb,acc,0.4107142857142857,0.0663363415035954,1 +cb,f1,0.1940928270042194,,1 +copa,acc,0.77,0.04229525846816506,0 +hellaswag,acc,0.44911372236606256,0.004963872936857941,0 +hellaswag,acc_norm,0.5824536944831706,0.004921466591335056,0 +piqa,acc,0.7421109902067464,0.010206956662056262,0 +piqa,acc_norm,0.7470076169749728,0.010142888698862455,0 +rte,acc,0.5812274368231047,0.02969666108123482,0 +sciq,acc,0.869,0.010674874844837952,0 +sciq,acc_norm,0.797,0.012726073744598285,0 +storycloze_2016,acc,0.7071084981293426,0.010523873293246305,0 +winogrande,acc,0.5698500394632992,0.013914685094716694,0 diff --git a/8b7178b35b/evaluation/rankeval/8b7178b35b_0.json b/8b7178b35b/evaluation/rankeval/8b7178b35b_0.json new file mode 100644 index 0000000000000000000000000000000000000000..faa42586e9fb7aeb567270c467ee7008fb38b6b6 --- /dev/null +++ b/8b7178b35b/evaluation/rankeval/8b7178b35b_0.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.335, + "acc_stderr": 0.014933117490932575 + }, + "anli_r2": { + "acc": 0.337, + "acc_stderr": 0.014955087918653605 + }, + "anli_r3": { + "acc": 0.33916666666666667, + "acc_stderr": 0.013672343491681819 + }, + "cb": { + "acc": 0.4107142857142857, + "acc_stderr": 0.0663363415035954, + "f1": 0.1940928270042194 + }, + "copa": { + "acc": 0.77, + "acc_stderr": 0.04229525846816506 + }, + "hellaswag": { + "acc": 0.44911372236606256, + "acc_stderr": 0.004963872936857941, + "acc_norm": 0.5824536944831706, + "acc_norm_stderr": 0.004921466591335056 + }, + "rte": { + "acc": 0.5812274368231047, + "acc_stderr": 0.02969666108123482 + }, + "winogrande": { + "acc": 0.5698500394632992, + "acc_stderr": 0.013914685094716694 + }, + "storycloze_2016": { + "acc": 0.7071084981293426, + "acc_stderr": 0.010523873293246305 + }, + "boolq": { + "acc": 0.5642201834862385, + "acc_stderr": 0.00867262173201595 + }, + "arc_easy": { + "acc": 0.6069023569023569, + "acc_stderr": 0.010022540618945312, + "acc_norm": 0.5526094276094277, + "acc_norm_stderr": 0.01020283238541565 + }, + "arc_challenge": { + "acc": 0.2738907849829352, + "acc_stderr": 0.013032004972989501, + "acc_norm": 0.2935153583617747, + "acc_norm_stderr": 0.013307250444941117 + }, + "sciq": { + "acc": 0.869, + "acc_stderr": 0.010674874844837952, + "acc_norm": 0.797, + "acc_norm_stderr": 0.012726073744598285 + }, + "piqa": { + "acc": 0.7421109902067464, + "acc_stderr": 0.010206956662056262, + "acc_norm": 0.7470076169749728, + "acc_norm_stderr": 0.010142888698862455 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/8b7178b35b/evaluation/rankeval/8b7178b35b_1.csv b/8b7178b35b/evaluation/rankeval/8b7178b35b_1.csv new file mode 100644 index 0000000000000000000000000000000000000000..d13a6a84bd7283b394cc470eb7d0594eec16b535 --- /dev/null +++ b/8b7178b35b/evaluation/rankeval/8b7178b35b_1.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.326,0.014830507204541044,0 +anli_r2,acc,0.344,0.015029633724408947,0 +anli_r3,acc,0.35583333333333333,0.013826518748493315,0 +arc_challenge,acc,0.31143344709897613,0.013532472099850949,0 +arc_challenge,acc_norm,0.32764505119453924,0.013715847940719344,0 +arc_easy,acc,0.6418350168350169,0.009838331651451844,0 +arc_easy,acc_norm,0.6300505050505051,0.009906656266021155,0 +boolq,acc,0.5574923547400612,0.008687051315181374,1 +cb,acc,0.5357142857142857,0.06724777654937658,1 +cb,f1,0.35670453061757407,,1 +copa,acc,0.74,0.04408440022768078,0 +hellaswag,acc,0.45140410276837284,0.004966158142645416,0 +hellaswag,acc_norm,0.5934076877116112,0.004901936511546116,0 +piqa,acc,0.7388465723612623,0.010248738649935581,0 +piqa,acc_norm,0.750272034820457,0.010099232969867483,0 +rte,acc,0.5415162454873647,0.02999253538537331,0 +sciq,acc,0.913,0.008916866630745925,0 +sciq,acc_norm,0.911,0.009008893392651516,0 +storycloze_2016,acc,0.6996258685195083,0.010600915927985026,0 +winogrande,acc,0.5698500394632992,0.013914685094716692,0 diff --git a/8b7178b35b/evaluation/rankeval/8b7178b35b_1.json b/8b7178b35b/evaluation/rankeval/8b7178b35b_1.json new file mode 100644 index 0000000000000000000000000000000000000000..e204ce1c437928daa6df02ede340bb78ca7d28a0 --- /dev/null +++ b/8b7178b35b/evaluation/rankeval/8b7178b35b_1.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.326, + "acc_stderr": 0.014830507204541044 + }, + "anli_r2": { + "acc": 0.344, + "acc_stderr": 0.015029633724408947 + }, + "anli_r3": { + "acc": 0.35583333333333333, + "acc_stderr": 0.013826518748493315 + }, + "cb": { + "acc": 0.5357142857142857, + "acc_stderr": 0.06724777654937658, + "f1": 0.35670453061757407 + }, + "copa": { + "acc": 0.74, + "acc_stderr": 0.04408440022768078 + }, + "hellaswag": { + "acc": 0.45140410276837284, + "acc_stderr": 0.004966158142645416, + "acc_norm": 0.5934076877116112, + "acc_norm_stderr": 0.004901936511546116 + }, + "rte": { + "acc": 0.5415162454873647, + "acc_stderr": 0.02999253538537331 + }, + "winogrande": { + "acc": 0.5698500394632992, + "acc_stderr": 0.013914685094716692 + }, + "storycloze_2016": { + "acc": 0.6996258685195083, + "acc_stderr": 0.010600915927985026 + }, + "boolq": { + "acc": 0.5574923547400612, + "acc_stderr": 0.008687051315181374 + }, + "arc_easy": { + "acc": 0.6418350168350169, + "acc_stderr": 0.009838331651451844, + "acc_norm": 0.6300505050505051, + "acc_norm_stderr": 0.009906656266021155 + }, + "arc_challenge": { + "acc": 0.31143344709897613, + "acc_stderr": 0.013532472099850949, + "acc_norm": 0.32764505119453924, + "acc_norm_stderr": 0.013715847940719344 + }, + "sciq": { + "acc": 0.913, + "acc_stderr": 0.008916866630745925, + "acc_norm": 0.911, + "acc_norm_stderr": 0.009008893392651516 + }, + "piqa": { + "acc": 0.7388465723612623, + "acc_stderr": 0.010248738649935581, + "acc_norm": 0.750272034820457, + "acc_norm_stderr": 0.010099232969867483 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/8b7178b35b/evaluation/rankeval/8b7178b35b_2.csv b/8b7178b35b/evaluation/rankeval/8b7178b35b_2.csv new file mode 100644 index 0000000000000000000000000000000000000000..85dbee7822267905b49cad1a5e55259b4b648e94 --- /dev/null +++ b/8b7178b35b/evaluation/rankeval/8b7178b35b_2.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.325,0.014818724459095522,0 +anli_r2,acc,0.312,0.014658474370509017,0 +anli_r3,acc,0.3541666666666667,0.013811933499570961,0 +arc_challenge,acc,0.3097269624573379,0.01351205841523836,0 +arc_challenge,acc_norm,0.3148464163822526,0.013572657703084948,0 +arc_easy,acc,0.6452020202020202,0.009817629113069696,0 +arc_easy,acc_norm,0.6494107744107744,0.009791003829831557,0 +boolq,acc,0.5954128440366973,0.008584355308932687,1 +cb,acc,0.42857142857142855,0.06672848092813058,1 +cb,f1,0.299808429118774,,1 +copa,acc,0.76,0.04292346959909282,0 +hellaswag,acc,0.45518820952001593,0.004969701081068372,0 +hellaswag,acc_norm,0.5997809201354312,0.004889413126208782,0 +piqa,acc,0.733949945593036,0.010310039263352831,0 +piqa,acc_norm,0.7383025027203483,0.010255630772708232,0 +rte,acc,0.4981949458483754,0.030096267148976633,0 +sciq,acc,0.915,0.00882342636694233,0 +sciq,acc_norm,0.917,0.008728527206074792,0 +storycloze_2016,acc,0.711918760021379,0.010472537019822582,0 +winogrande,acc,0.5761641673243884,0.01388849238994452,0 diff --git a/8b7178b35b/evaluation/rankeval/8b7178b35b_2.json b/8b7178b35b/evaluation/rankeval/8b7178b35b_2.json new file mode 100644 index 0000000000000000000000000000000000000000..d7329d965aa921ecc0d1f74cdfe452d7c3a9df22 --- /dev/null +++ b/8b7178b35b/evaluation/rankeval/8b7178b35b_2.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.325, + "acc_stderr": 0.014818724459095522 + }, + "anli_r2": { + "acc": 0.312, + "acc_stderr": 0.014658474370509017 + }, + "anli_r3": { + "acc": 0.3541666666666667, + "acc_stderr": 0.013811933499570961 + }, + "cb": { + "acc": 0.42857142857142855, + "acc_stderr": 0.06672848092813058, + "f1": 0.299808429118774 + }, + "copa": { + "acc": 0.76, + "acc_stderr": 0.04292346959909282 + }, + "hellaswag": { + "acc": 0.45518820952001593, + "acc_stderr": 0.004969701081068372, + "acc_norm": 0.5997809201354312, + "acc_norm_stderr": 0.004889413126208782 + }, + "rte": { + "acc": 0.4981949458483754, + "acc_stderr": 0.030096267148976633 + }, + "winogrande": { + "acc": 0.5761641673243884, + "acc_stderr": 0.01388849238994452 + }, + "storycloze_2016": { + "acc": 0.711918760021379, + "acc_stderr": 0.010472537019822582 + }, + "boolq": { + "acc": 0.5954128440366973, + "acc_stderr": 0.008584355308932687 + }, + "arc_easy": { + "acc": 0.6452020202020202, + "acc_stderr": 0.009817629113069696, + "acc_norm": 0.6494107744107744, + "acc_norm_stderr": 0.009791003829831557 + }, + "arc_challenge": { + "acc": 0.3097269624573379, + "acc_stderr": 0.01351205841523836, + "acc_norm": 0.3148464163822526, + "acc_norm_stderr": 0.013572657703084948 + }, + "sciq": { + "acc": 0.915, + "acc_stderr": 0.00882342636694233, + "acc_norm": 0.917, + "acc_norm_stderr": 0.008728527206074792 + }, + "piqa": { + "acc": 0.733949945593036, + "acc_stderr": 0.010310039263352831, + "acc_norm": 0.7383025027203483, + "acc_norm_stderr": 0.010255630772708232 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/8b7178b35b/evaluation/rankeval/8b7178b35b_3.csv b/8b7178b35b/evaluation/rankeval/8b7178b35b_3.csv new file mode 100644 index 0000000000000000000000000000000000000000..bf6a39d15256f52ce110b325ebab5ec40c2666f1 --- /dev/null +++ b/8b7178b35b/evaluation/rankeval/8b7178b35b_3.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.336,0.014944140233795023,0 +anli_r2,acc,0.349,0.015080663991563102,0 +anli_r3,acc,0.3383333333333333,0.013664144006618268,0 +arc_challenge,acc,0.3037542662116041,0.013438909184778755,0 +arc_challenge,acc_norm,0.32081911262798635,0.013640943091946531,0 +arc_easy,acc,0.6460437710437711,0.009812370644174425,0 +arc_easy,acc_norm,0.6548821548821548,0.009755139387152029,0 +boolq,acc,0.5914373088685015,0.008597580502718664,1 +cb,acc,0.5,0.06741998624632421,1 +cb,f1,0.435174510009433,,1 +copa,acc,0.73,0.0446196043338474,0 +hellaswag,acc,0.45717984465245964,0.004971449552787175,0 +hellaswag,acc_norm,0.6003784106751643,0.004888194985997393,0 +piqa,acc,0.7470076169749728,0.010142888698862464,0 +piqa,acc_norm,0.7535364526659413,0.010054810789671815,0 +rte,acc,0.5812274368231047,0.029696661081234824,0 +sciq,acc,0.921,0.00853415677333344,0 +sciq,acc_norm,0.921,0.008534156773333442,0 +storycloze_2016,acc,0.7129877071084981,0.010460934115933266,0 +winogrande,acc,0.5611681136543015,0.013946933444507032,0 diff --git a/8b7178b35b/evaluation/rankeval/8b7178b35b_3.json b/8b7178b35b/evaluation/rankeval/8b7178b35b_3.json new file mode 100644 index 0000000000000000000000000000000000000000..1db661994747881fbc50959de05c9648a3a54792 --- /dev/null +++ b/8b7178b35b/evaluation/rankeval/8b7178b35b_3.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.336, + "acc_stderr": 0.014944140233795023 + }, + "anli_r2": { + "acc": 0.349, + "acc_stderr": 0.015080663991563102 + }, + "anli_r3": { + "acc": 0.3383333333333333, + "acc_stderr": 0.013664144006618268 + }, + "cb": { + "acc": 0.5, + "acc_stderr": 0.06741998624632421, + "f1": 0.435174510009433 + }, + "copa": { + "acc": 0.73, + "acc_stderr": 0.0446196043338474 + }, + "hellaswag": { + "acc": 0.45717984465245964, + "acc_stderr": 0.004971449552787175, + "acc_norm": 0.6003784106751643, + "acc_norm_stderr": 0.004888194985997393 + }, + "rte": { + "acc": 0.5812274368231047, + "acc_stderr": 0.029696661081234824 + }, + "winogrande": { + "acc": 0.5611681136543015, + "acc_stderr": 0.013946933444507032 + }, + "storycloze_2016": { + "acc": 0.7129877071084981, + "acc_stderr": 0.010460934115933266 + }, + "boolq": { + "acc": 0.5914373088685015, + "acc_stderr": 0.008597580502718664 + }, + "arc_easy": { + "acc": 0.6460437710437711, + "acc_stderr": 0.009812370644174425, + "acc_norm": 0.6548821548821548, + "acc_norm_stderr": 0.009755139387152029 + }, + "arc_challenge": { + "acc": 0.3037542662116041, + "acc_stderr": 0.013438909184778755, + "acc_norm": 0.32081911262798635, + "acc_norm_stderr": 0.013640943091946531 + }, + "sciq": { + "acc": 0.921, + "acc_stderr": 0.00853415677333344, + "acc_norm": 0.921, + "acc_norm_stderr": 0.008534156773333442 + }, + "piqa": { + "acc": 0.7470076169749728, + "acc_stderr": 0.010142888698862464, + "acc_norm": 0.7535364526659413, + "acc_norm_stderr": 0.010054810789671815 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/8b7178b35b/evaluation/rankeval/8b7178b35b_4.csv b/8b7178b35b/evaluation/rankeval/8b7178b35b_4.csv new file mode 100644 index 0000000000000000000000000000000000000000..4dd88d528f814533e9ba267356be0eb0a8dae8a3 --- /dev/null +++ b/8b7178b35b/evaluation/rankeval/8b7178b35b_4.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.33,0.014876872027456734,0 +anli_r2,acc,0.344,0.015029633724408947,0 +anli_r3,acc,0.355,0.013819249004047301,0 +arc_challenge,acc,0.29948805460750855,0.013385021637313558,0 +arc_challenge,acc_norm,0.3293515358361775,0.013734057652635473,0 +arc_easy,acc,0.648989898989899,0.009793703885101047,0 +arc_easy,acc_norm,0.6452020202020202,0.009817629113069696,0 +boolq,acc,0.608868501529052,0.008535239054221166,1 +cb,acc,0.5,0.06741998624632421,1 +cb,f1,0.42649620505163616,,1 +copa,acc,0.77,0.04229525846816506,0 +hellaswag,acc,0.4567815176259709,0.0049711062650465545,0 +hellaswag,acc_norm,0.602867954590719,0.004883037758919963,0 +piqa,acc,0.7410228509249184,0.010220966031405609,0 +piqa,acc_norm,0.7486398258977149,0.01012115601681925,0 +rte,acc,0.5379061371841155,0.030009848912529117,0 +sciq,acc,0.917,0.008728527206074789,0 +sciq,acc_norm,0.921,0.00853415677333344,0 +storycloze_2016,acc,0.7103153393907001,0.01048980809194661,0 +winogrande,acc,0.579321231254933,0.0138745263720083,0 diff --git a/8b7178b35b/evaluation/rankeval/8b7178b35b_4.json b/8b7178b35b/evaluation/rankeval/8b7178b35b_4.json new file mode 100644 index 0000000000000000000000000000000000000000..11c0c9e621f4d09bc55697885c8c0c05bcfb6f1d --- /dev/null +++ b/8b7178b35b/evaluation/rankeval/8b7178b35b_4.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.33, + "acc_stderr": 0.014876872027456734 + }, + "anli_r2": { + "acc": 0.344, + "acc_stderr": 0.015029633724408947 + }, + "anli_r3": { + "acc": 0.355, + "acc_stderr": 0.013819249004047301 + }, + "cb": { + "acc": 0.5, + "acc_stderr": 0.06741998624632421, + "f1": 0.42649620505163616 + }, + "copa": { + "acc": 0.77, + "acc_stderr": 0.04229525846816506 + }, + "hellaswag": { + "acc": 0.4567815176259709, + "acc_stderr": 0.0049711062650465545, + "acc_norm": 0.602867954590719, + "acc_norm_stderr": 0.004883037758919963 + }, + "rte": { + "acc": 0.5379061371841155, + "acc_stderr": 0.030009848912529117 + }, + "winogrande": { + "acc": 0.579321231254933, + "acc_stderr": 0.0138745263720083 + }, + "storycloze_2016": { + "acc": 0.7103153393907001, + "acc_stderr": 0.01048980809194661 + }, + "boolq": { + "acc": 0.608868501529052, + "acc_stderr": 0.008535239054221166 + }, + "arc_easy": { + "acc": 0.648989898989899, + "acc_stderr": 0.009793703885101047, + "acc_norm": 0.6452020202020202, + "acc_norm_stderr": 0.009817629113069696 + }, + "arc_challenge": { + "acc": 0.29948805460750855, + "acc_stderr": 0.013385021637313558, + "acc_norm": 0.3293515358361775, + "acc_norm_stderr": 0.013734057652635473 + }, + "sciq": { + "acc": 0.917, + "acc_stderr": 0.008728527206074789, + "acc_norm": 0.921, + "acc_norm_stderr": 0.00853415677333344 + }, + "piqa": { + "acc": 0.7410228509249184, + "acc_stderr": 0.010220966031405609, + "acc_norm": 0.7486398258977149, + "acc_norm_stderr": 0.01012115601681925 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/8b7178b35b/evaluation/rankeval/8b7178b35b_5.csv b/8b7178b35b/evaluation/rankeval/8b7178b35b_5.csv new file mode 100644 index 0000000000000000000000000000000000000000..8d1987ced554499074b05c93b08bef2eec4d510c --- /dev/null +++ b/8b7178b35b/evaluation/rankeval/8b7178b35b_5.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.351,0.015100563798316402,0 +anli_r2,acc,0.352,0.015110404505648668,0 +anli_r3,acc,0.36833333333333335,0.013930121355353778,0 +arc_challenge,acc,0.2986348122866894,0.013374078615068756,0 +arc_challenge,acc_norm,0.3310580204778157,0.013752062419817836,0 +arc_easy,acc,0.6456228956228957,0.009815004030251746,0 +arc_easy,acc_norm,0.6464646464646465,0.0098097289481515,0 +boolq,acc,0.6070336391437309,0.008542335147970564,1 +cb,acc,0.48214285714285715,0.0673769750864465,1 +cb,f1,0.3366858237547892,,1 +copa,acc,0.76,0.04292346959909283,0 +hellaswag,acc,0.4567815176259709,0.0049711062650465545,0 +hellaswag,acc_norm,0.602370045807608,0.004884079750433882,0 +piqa,acc,0.7410228509249184,0.010220966031405609,0 +piqa,acc_norm,0.7431991294885746,0.010192864802278042,0 +rte,acc,0.5667870036101083,0.02982676408213828,0 +sciq,acc,0.922,0.008484573530118581,0 +sciq,acc_norm,0.929,0.008125578442487917,0 +storycloze_2016,acc,0.7156600748262961,0.010431614128665242,0 +winogrande,acc,0.5595895816890292,0.013952330311915603,0 diff --git a/8b7178b35b/evaluation/rankeval/8b7178b35b_5.json b/8b7178b35b/evaluation/rankeval/8b7178b35b_5.json new file mode 100644 index 0000000000000000000000000000000000000000..a2141ac525a291160e8f135b0eb0b476cd1e8659 --- /dev/null +++ b/8b7178b35b/evaluation/rankeval/8b7178b35b_5.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.351, + "acc_stderr": 0.015100563798316402 + }, + "anli_r2": { + "acc": 0.352, + "acc_stderr": 0.015110404505648668 + }, + "anli_r3": { + "acc": 0.36833333333333335, + "acc_stderr": 0.013930121355353778 + }, + "cb": { + "acc": 0.48214285714285715, + "acc_stderr": 0.0673769750864465, + "f1": 0.3366858237547892 + }, + "copa": { + "acc": 0.76, + "acc_stderr": 0.04292346959909283 + }, + "hellaswag": { + "acc": 0.4567815176259709, + "acc_stderr": 0.0049711062650465545, + "acc_norm": 0.602370045807608, + "acc_norm_stderr": 0.004884079750433882 + }, + "rte": { + "acc": 0.5667870036101083, + "acc_stderr": 0.02982676408213828 + }, + "winogrande": { + "acc": 0.5595895816890292, + "acc_stderr": 0.013952330311915603 + }, + "storycloze_2016": { + "acc": 0.7156600748262961, + "acc_stderr": 0.010431614128665242 + }, + "boolq": { + "acc": 0.6070336391437309, + "acc_stderr": 0.008542335147970564 + }, + "arc_easy": { + "acc": 0.6456228956228957, + "acc_stderr": 0.009815004030251746, + "acc_norm": 0.6464646464646465, + "acc_norm_stderr": 0.0098097289481515 + }, + "arc_challenge": { + "acc": 0.2986348122866894, + "acc_stderr": 0.013374078615068756, + "acc_norm": 0.3310580204778157, + "acc_norm_stderr": 0.013752062419817836 + }, + "sciq": { + "acc": 0.922, + "acc_stderr": 0.008484573530118581, + "acc_norm": 0.929, + "acc_norm_stderr": 0.008125578442487917 + }, + "piqa": { + "acc": 0.7410228509249184, + "acc_stderr": 0.010220966031405609, + "acc_norm": 0.7431991294885746, + "acc_norm_stderr": 0.010192864802278042 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c0abf8f8ba186abb14191f7e411f59019d819c3e --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:17a7f40da817d6e095da220de704ae987ff39ac3b0dab7e6d474a2b68118d2eb +size 208731415 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3bc0c53a74a230464fe1be328218140778f2a870 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fda0ed9490bdcdc6d9f37a55b9e6bcc563cf40e916c176aa976c168d2c483547 +size 208731415 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_0_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_0_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cc07eb5917ed918ff59953d5e128a4a1df681faf --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_0_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ec3dfbfbe6f4a0d5bb8ee6b6f9942a8656197f57f2dc0481e64d25f48b9cb35 +size 208732183 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_0_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_0_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8cbeee3a1ce3f221555c4b6d36c6c8f7fc9a7e1d --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_0_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92acd2ad9cabe2be13cd9b4dd9734e11d06d4548801d00aeef5b3f57357ad0c4 +size 208732183 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1c29740cbc2034ce7d7fe11010c47281a0fff2da --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f2e6b2f355d4d340eb78de12e9ae4963f175558f777e40dee3bf22492c219e26 +size 208731437 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a3bfe1616f6d2a2d98df753826c19f5b5218ac93 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:289deac01544e7b1ce07fc4701fd9fa03711745880779dc8f05c10bc203f25e2 +size 208731437 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_100_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_100_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b0dc65e6ae0880d59c874d7911ca59709c7f7964 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_100_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a341db79f99b04ffbc83f7a6e88f07a79902843f0cdd6cb4db677a2f8f6ff162 +size 208732269 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_100_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_100_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c647f9568bdae89a5235707ef56187bb4757d20a --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_100_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eba98f1674c7c7d591616de27894ddbb18c87e16283380ad935862156103192e +size 208732269 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e5c638002c2ee33ca297cb49568cea4ea063896a --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d7a44dfd8cff80f7852763d3500150d65b6e38cee6bb97632cc99c248a7e4c2b +size 208731437 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b33d3d0f34fcd5261b4fb639d77a15eadc2e41ea --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e682980be80d5c75262b2101f6d76d40277a402aaecffb0bb7903065a3eaafa9 +size 208731437 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_101_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_101_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..079bdcadccc0de15280b4a765b199930b348726e --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_101_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:15c8f3291cf73e7771156cb99ec43aa0cdf5ef532bb15201f2cac38d9e5de29d +size 208732077 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_101_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_101_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..698baae994927f90216e9465c017b8f22793c099 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_101_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d46d0c192f7e9c9d7ed61b6785772ee5d14bf662a7ac710c6b592bf28490e9ce +size 208732077 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6a35c843214f2efecc2c102641826b0e87bc5e56 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f3ad556a60fd49790c6e245307a068dc1af7439b2ff5b1168dc1c28f0bac12d9 +size 208731437 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..861428c0a952149a847a2b9d13766adf89ca9dae --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db115d3f985607b09c130f628362a12be1370f36af2fc6a538d997347201d0d9 +size 208731437 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_102_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_102_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..62436329a4f89327567350dcae3a96e7a4620a27 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_102_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1965ff8bf1a5f8fb79511103e834c36e1c6d494500fb49d13e229d21f24735bc +size 208732205 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_102_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_102_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..13b260f90bd2a0a9e90d60a493647995ad0cfc90 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_102_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aeb99aea82dfbe4246e19d1985cb4eee220c99efbf555f7e847d1bbd5966bc96 +size 208732205 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..59c68902af8754dbbf395f9b09749ff82af28250 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e345a2e0659af1632d2345afc0d9a8a37b773f3a30eec7e41d0065512a5e3e8e +size 208731373 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f93f43795bd197b1d1699dea43150223e6b37ca3 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c37d0e0979766e12223aca6cdc5c139363a781aee9c114815d5019ad777c2b1f +size 208731373 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_103_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_103_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e7a5058602777436a7238364bea247f30ad3a0db --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_103_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:037311840f8a70f0bb843719db6c034f020311c627e4166896c12eab22dab581 +size 208732205 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_103_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_103_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..04fb6bd751bdcba9486a57772bd925de303daf28 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_103_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e1fd2508123b20fa6403c8929d58fa934bf78ef51f32cd8e2b6e73d7dae3458 +size 208732205 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..95ab83207bf7f925de5c993e500b2388e6b59f97 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb07d32700e66a16957faa5b7395a156292580fe9b00d49f30743ba65930b46d +size 208731501 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..301302a60e1cdd30f41e7d17285dc2862c5034b6 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f21486724a5e5c2e68c0138a81e0702fc234892b8909db54666a874765213ea7 +size 208731501 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_104_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_104_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8723f541c4c9d3168579486cabb3b228b97df4cd --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_104_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4eb8483dee3c169ad26cc181c6c791556da31f2bf608998a20252e0986fb718e +size 208732205 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_104_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_104_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a8e88a332c5090ccff98661e792a02acde0c4141 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_104_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f6b4a107e22328dbc90799b2b8e577485c05850188caf7ed94e455ff1eb86829 +size 208732205 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e96c5645bdef99b3770c77b71a9cbaa8e04703df --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ed12044c9c5e1c8ce1a77b64cdf934cfd3ed5f901439fdfc3b7868437d0f8b9 +size 208731437 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a94e01b7fbfe3fd480ace90c0b1ad1bf1300b8b8 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c47ad0eceeb6d187b5fa38d76ae33a4c6a8cc35c1e92383db144c417ac225c9 +size 208731437 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_105_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_105_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..489aea5196824610e773efc3dc8d66f4006fcc1d --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_105_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d064db67b8c3038cb909122cb7ee04938aa734f214fd74e2dfd4f7be9fa58a38 +size 208732205 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_105_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_105_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..427b724de54325632dacfa912c5d83369ad5a6e2 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_105_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0559315f1f939cc3259e6c436b5d49bc84a8597ce72ace78ad766b5457600cda +size 208732205 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..67a41942e1695dbb8c260e6d197894ad557d1630 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0cdcbd15283e6fc6834eed5b69b6ca0aff57d62ae03b449ebb4953e65fcc5966 +size 208731437 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cfa455816c447087e42c5c615b5e1c4d32e629fa --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:801064884288984e2741972cef3c1890a7ab3a5487db88bb1b5d41dbc0acb67f +size 208731437 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_106_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_106_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6762da3b379f549dddf3f1c5e0b018b9dc8f02c2 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_106_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e20500aee55cb0230f9157b5ce5fa69b40d5d0724f9398646cb34b922f9252a6 +size 208732269 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_106_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_106_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..99ff1b68bbc836c0ce16b70fdb0662343dd4e12f --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_106_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:01b0a1b1396f49d9c761caf3955bb0309cecafd577c30dab35d00de66dfaa680 +size 208732269 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1d8ebc472d11f5a2b84273613172b23955c83a31 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd13e62ec6b7eaf68647d1007424d0684245eb478b707828b5aeebdbcc97acd1 +size 208731501 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4c91e6e0bf626b8cfa0497e0081ffe37b9fc232f --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5cb32e3b0628292065a2eb3da6b385f4368b656d335eed7eef0b891f75535fee +size 208731501 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_107_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_107_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..15f838e3dbd71d746956c8b9e6de6454c9b0da8d --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_107_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be7bee09b80937d1a30f8446f29dd44dc8f9031801e4bad5700172e903693236 +size 208732205 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_107_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_107_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..82e30f900d8382d28e9c87071fe36c09b8d81623 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_107_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31542d6b2b6e33d9b7adea61006a63ca2b9fe90d8c2415acb8d9cbb0cd855f2f +size 208732205 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3b107a4cd16e7780953c213e810f18c677e1e1bb --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9059d558f6d27d39f8991ac5e90273fa8254f5fe7e5bf3ec19d0fe3834db0eb9 +size 208731373 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..813e0caa1f2df39eb5544f603784ded5eb65e027 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:85c53239e2695378bc77df230568bcc43ae3d0543a56c9e1c71e3a21ff2bc3dc +size 208731373 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_108_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_108_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..59633e96992ff97ee9b3868146c940d841f606f0 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_108_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e994e9966e8895f3c8bdab480cdf12e29fd374f17fc7b89f7cb957c42ae00cc +size 208732141 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_108_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_108_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ec5c635cf363e307e66d97bf026b52b19c5e37cb --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_108_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6add20384e5b23113efe65870d42ea8d53fe901e38bb03a3071d1b23335e05c3 +size 208732141 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a2b5b4796db69627991764b55f35cdbffa14d557 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4ca0cb89fd1b4dd09094d19e20080cdc67a15f3403371848e2a9b340bd6a806 +size 208731373 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..49c2d87484e2c86ccc8d13a6425daedc31f8d72b --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bfa88b003bd816786b4d8ddc0b61d020a23a5dc3e6a4f656225e680ff67d5722 +size 208731373 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_109_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_109_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..07a5527fcdcdf32e8e9a5bfe21a01b05ccdf048e --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_109_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:17211b223ab3d4d5b3e81184d0d83c40e7b634a9bf45c16fd5735c1f78e79871 +size 208732141 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_109_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_109_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7e64e0ac5e718a78d2130023ec4b2420a63df259 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_109_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b4a9786029e0fb48f90f9ec4a38b8da4221c47dc1e28ad94fbe3ed93ce3be7b9 +size 208732141 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0dbd6e866b818bb1c29d3277a0aea752316af45f --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c749a612985ba093cba70e25a24b87835f51e636b996a96b5c2ba27b95d175ff +size 208731362 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3a143c2c80d0836be64ecd7c488075dfe5837cd3 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dbe716751e91a98310002b89e324fc48fed8daa698e7325b09311ebe9074410a +size 208731362 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_10_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_10_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..47fea6ed54bf6771f2c78a78048b87f72d6b3a81 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_10_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5de0519e2832408b09eb252fc6fe2c1c8535c153c13302b006693d297d5cd097 +size 208732130 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_10_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_10_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cf4a78f6c86fc9601e265d77516563a934d97495 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_10_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7af6726c95f755f03272bc8941632ec15d572ec14ee33879640d08f551b6ad34 +size 208732130 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cfe6a26cab3eb55654179ec7ce08d566dc298592 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fbc524252e8d829fdd8b59d7a59be9e4cfc0d8fda1c37e79cf05f51e50186cd6 +size 208731437 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..40c9c5f62d8a2bb9699a38b03eaf0fe3ba54e8f2 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:384006a13d4e2e152924b389e470484a307ec0decddc1da2bd5387dad5263210 +size 208731437 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_110_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_110_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..df423996300f65a109cdbade6eb9a228a0e2f8d4 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_110_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd052f92a2a953710ad71e9a9127c48f6e4e5fefc782a5aad1a41bfb45f62ad8 +size 208732205 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_110_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_110_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..99f0b05c4c200d7c9ec4fdb498693f8a468ba98a --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_110_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84fa6311a381f51b3d952e5071aed0eaf2a5bf36f68cb48d8521c07c3edd3523 +size 208732205 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..768e53f8cc80cd798bae145372126dfeae30504b --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d976aaa7276f808654921f8d468e788cb33f61a6c2aa3cba5d3b0f62369124b5 +size 208731373 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b180f69e71bb87402d0e2230006343b161f050be --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:40984ae639e7c2e0268e8603e481d4be88ba9dcb6d81bdd10bc682289d03b518 +size 208731373 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_111_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_111_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..36803fff8d3bb6f6c599052908fb8659184aaa0a --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_111_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f6dad8a3623c94d500bc6feaa7ca633fd4f43756a11ffd42fafd20e434d9172 +size 208732141 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_111_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_111_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fec9b42e9fa8d75c54bc8a2d6b10436ea0eb903d --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_111_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bcdb061a9ece5fe63014ec1aaf5ecb8913379932868075bb23412f862def4e1b +size 208732141 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ba5345d2e208a0a05ad4b82a0885da45d9d16653 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:13569d90c3f313a2f538c25f2583bb594df28dcaeae8efcf1f7fee3d025c8f0b +size 208731437 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fc243b92d778b9abe02f7bfa533a441b7f759d2e --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1266c3035e6b7de4f04f6fa9175959aeeb17d51e778f03f362b292d74a94d14a +size 208731437 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_112_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_112_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b9d4bf9ae05d0e961350510eeea69b5702e6ed13 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_112_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1131dfc1f28cc61cb77c7419eabe3927e1d2951d497e57e576ce6625380bf41d +size 208732269 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_112_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_112_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9d04c3753133668a057cd1bbdecd35192f07e159 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_112_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7314f06f9b29ced6fcbda5906121fad31ce5782009080d99380023ada51ee78e +size 208732269 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..15cbd2457e67e82c3750f718df9d050855f67b12 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:376f43921269aca0feb2802fd9b6bb3d41b398688b2a2e4d9cb27aaa2605b7e6 +size 208731501 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..051442eadc64d015bd10dd8837b6de74e17f8fbb --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9cb24f1c5ec3b7334368ef92c9867d579cf9f02934b51423094b6e273bad3bc9 +size 208731501 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_113_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_113_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a19aa50e815f612302b04fb3235fa1e7ab1ea742 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_113_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f2e7ff98dd886734550bccbcf1c4fd53cbcaad6b6cea9bc72c5e04292a74be0 +size 208732141 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_113_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_113_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..411a03bef3c8193b218f86f33b883ec650ca7aec --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_113_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5aacfdf1f8c8f889d7cdce6f3806e578dfe403696e2ce84b8dad1ec9e2a80681 +size 208732141 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7b54a7889ac806fe9cc3a2b5b0c02d7907420d70 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:414dfbebe019e135572b9287dd95fb8d6dec4a27d5956869dcea167243fa8c6a +size 208731309 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ac19965eedded4cb22729277f1a97352c1db8fb7 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5025a3338063768695bd4cb4416a4619b7989f6796f18a1f5562106867a11035 +size 208731309 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_114_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_114_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..458e4674ae9ff9a453cc7a991149e2171de53611 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_114_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd6769883f99391f3a3d197e3a5b04ff5caa5ad09a7a00e887967f40579fbf12 +size 208732141 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_114_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_114_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ec97d63c1dc6f2d8ef174fd22f0c38407041eaf6 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_114_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cecbfe20b2f88938d95aa9d115eb79b19488b190bfeb67b4cf04423a5a63a0af +size 208732141 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..906bad98f691f70e92138e088d2dd9688e27929c --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae258f1e66bd2a1a6f8e981732174d56a3dbe11ecd7624c5ef36726ce887a02a +size 208731437 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..377294352f954c085b998b7d5b8853aff85bb06f --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a0705da96c010cd176f728457bd9363157354c6c75829899558a14ef7c2954d +size 208731437 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_115_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_115_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fe5d12266a0d1e2df1fa1d37e989ecda129101c6 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_115_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc0e02cd60519a3faa37b720238490917f4ee41ec0c867d8a422b19d70f2f41e +size 208732205 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_115_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_115_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a5865ced86628ed01d01b90cb1436492f8787e25 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_115_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1bf73520536bd066da549e48642022ab94b4ca26eb6129f119135a21b8b7343a +size 208732205 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a17f24ad3fbfa4ff82cf1a7cb87536fa376dffdb --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ecd2f09e458b667b9a23d01f008ebebcbc0a9ee73dd3fec89b65554250a7d53a +size 208731501 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..15525958da1482ed8c6212946c87d7636697bcd8 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:18bab51bdcedd639fc8e87c44e06da8cd945a6f85a6f93ebb38abc0fdc0260d4 +size 208731501 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_116_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_116_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4fd57ad808c908b6e7614f4f28517b0ae663d678 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_116_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f5668999b6bdf9098928ecb2cd34899e9c092a52ea9d50826a7a6e07db88f41 +size 208732269 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_116_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_116_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f2240e6e1ab6bda181e93584209fa130512fabe2 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_116_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:89f86b41cfd4ca3ba5e0cb39877f146d033b4b2ae451e7e44761bdfecc53cb13 +size 208732269 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..75e954de613e38c1f228dfe1fdd4f7a8f29e8d28 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4790d7a71d42a7bc1c627f0da7394634d7cf8628044b648a5d8c571b50bc7cb1 +size 208731437 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..aae373450ad8abe067f7f19531690a738bdd4238 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:250042d0da3c550dbe69407de7742f91614b65c9d7bda77ef0d8082c2f8c21fc +size 208731437 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_117_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_117_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ed67263827f7262f05e9b907fc330ae9b1d87347 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_117_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5222466e56fc77e27432942e7a0c3177acf8ffc30a418fddbf9c11eb8ec7cc4a +size 208732205 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_117_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_117_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9ee4087fd99d3b8b95aad64015f80cb1c93476bd --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_117_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:52f26e853dec1faef7d0a24cd2a783a253f74fef01c741b363223b327ccc8936 +size 208732205 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3a3e72baf2dbbb2d3b10ae56aef85cf84dfc6c60 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b45aab639bd0ea76f73cd1d90dbb7d38e59feb5262b803d026ceefcc87b0822f +size 208731437 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..169631dd0f24343ea4c16b8e8989bbd0bf11aa8f --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8839aef0ffd58d15133658f151305a0a57cec00d21e3eaff482056bbf47b25f +size 208731437 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_118_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_118_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fc72dec9201e56fc591bab2160d3f5e224869e88 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_118_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a0697509548e0d86d9aa4fc8f26b9cb0953f59f9732ed0203e9030b78422fa7 +size 208732205 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_118_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_118_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b9499648e7165b54b88782afd4ca9cb0d06e1426 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_118_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee52d67e2b33a907113875541184e529e0d2c138e03b15c38f4d4987af713ceb +size 208732205 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..809212e890372744c1901f47387a797cc0318867 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e64aaa38438200201e72ebc6c5c34998e5ff10bd3677d280b4f83e08bacfcde9 +size 208731501 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dd4c8d467a0a89b85b94af11caea3f7a06e5522e --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e69a7f6150615f35284ed8b742dfbbb83a0455bbc421baafdbf052cf47c32cce +size 208731501 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_119_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_119_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9b538b58082c3690522761405bdb4183e7f01929 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_119_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:41545114daeb3f61e4dbf2c0f0f312b17c21a359f3456c083220bf9464342d5c +size 208732141 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_119_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_119_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b30d284059c1ac2f453160113be8be033b989e55 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_119_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da1bf0be6bf477ab88efd97e25ed4b55fef854844a25a2846bfd71447c4b16b6 +size 208732141 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c85698e1ded9bd42f57f3a02acf2ead23cc945ea --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d43ae3e5feb2770f52e72416756994ef19ab0864edb51ed020b8860507833945 +size 208731490 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e8707b51bda109ea58f9b5d73eaa5ba40b6fd8d0 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e099047a227940b6eed2660b2bbfe2944dcc1039c0e72022ec67497b48f5303c +size 208731490 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_11_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_11_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..66f08bf08a31d7f9df34eda68749be82073cf1f4 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_11_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:443df6ba79f37b6236c9d9512959a5fc49a2212b779a96d6f14a1a7aefea7efe +size 208732258 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_11_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_11_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..37cb897ecb132787700181be30c89dfaa95f5559 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_11_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e1c08091ef6786d3a01dfb8c378a447ccb057d641878a069654f4f8e1d0ac1f5 +size 208732258 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d5c79e316d2f6b9e1b3d3ee0f82d713e76a23d9c --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:025b39407c378bfe1692cd72e03e581e27736309f69b25675aa8b42396bdf8cd +size 208731373 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3cf0955c36242162f8d1a7dc16927a1475c4413b --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2014989e6ee4c4d478a71576c4e8de35da5b7f9ee71ccf7ba79a516a936233a4 +size 208731373 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_120_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_120_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f8f4f211f0cadf8953858555e45afbdc2fc577f4 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_120_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e4e6dc19b5a7a7bea3c85124889238e9aba26ed46b7f926e14cd8aa59b97287 +size 208732205 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_120_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_120_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4af6a6ded6b54f3e32ff73ecab212d6c80ef5d34 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_120_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:abe8e4ddde80c4dbee0d1247dd9dff1e5a56fd1e6cde204f6b909adca3eba1bc +size 208732205 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c866f13daace757275e63fe9fe50f1a3b52f9e9e --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:882ea097f164c9f507b75bb316c906963aaa6834a12a6593feb3c7b1a01a9c63 +size 208731437 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f494e21d9eebb0dd0124236fdf8ff5985fbb5fbd --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f5dbd3b1fb0361e02f351beb4be0b701119b43110f77a2b2e0127316a72e5dc +size 208731437 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_121_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_121_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..13e5941e649f3f00f97d19e21f7eec3ccd705997 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_121_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c07acf7a6d3c7eeb761ac6e2612992169c6472392fff2d8cd63bed058188d72 +size 208732205 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_121_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_121_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0c2a1082db72dd5a79636b4b418a670d677ea751 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_121_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f889564980d15caab9aec4683e24d625f65dac0bae1d3af1852e479b4365ea23 +size 208732205 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1ca6d2702440f96b628d906f6d1a2962f9193b69 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:25f8293c3304c0a0ad861adee2acaf42eb179e6b165d76697b90eb11a1d42870 +size 208731309 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d221e4eb8471b93603d0331dc2ee6a614988524f --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c44098e7b7d66aa4ad4e059a331a250ae648ee6c2215fbce4336a3970c85ea4 +size 208731309 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_122_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_122_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3a66b645c2cefc4981dca0743a24284e1904d2bb --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_122_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de7cd775c6bbbbc53d3d76ad910d17a485034485638705295e1d2b7f0a9d7b9f +size 208732141 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_122_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_122_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d6f9dc81b3793ad2fcb1204c56b5db6047a08e25 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_122_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d7d7cbbd9d63522a3b0b28a76529b2dc976eba0697a3f0bd4967aea75dbfafda +size 208732141 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..112b061c6f808037ecd25eb6e099c50ae264e1cd --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:275734ec13c75471c088cbd1cfea652926050b7d3dbc2b87a33e48f1b9706a15 +size 208731373 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ba53e1c15b0cf82c8d276112869dc57ea9fe8986 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b4d8d72a59716cfb2d1563a7b612cca0a01cd9abefe21d99ee61c0aa8ae1a111 +size 208731373 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_123_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_123_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..762b3a69312bc7cadef38da61a1dacc791ab0aae --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_123_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f515d7dfd6bfc326f923053bfb27c534e434bd658eb7f2642be6ddf6a241bc9b +size 208732141 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_123_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_123_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3154c1dcfd963371d41fd2decfcfdca9f9bd3f74 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_123_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db0c54391d8679aee41adc227421862505e572f2ac957d6d1932fabc268a99b3 +size 208732141 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b0626aa2085dd3ae2a6b7d49788bbbb90d82a006 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c2cc9a9f8acdd7f5fb2db8786fba8f15787fa796a68f28a1bf74686fc2d7e02 +size 208731501 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f201f225f498c0950466ed8b0714601b27166c43 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8bc643eb556b888ce9bb52042d325accff911805f9f635646955875fbada70fb +size 208731501 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_124_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_124_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..850c6aa9c643c085d126792025931f2b5cb95a35 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_124_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f1226965e0775c7fde7fa091c2632f295246be07f705a3ae64e86a6e32356dd4 +size 208732269 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_124_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_124_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bb2ac6d84eb8f0e546355d7412989542b2e37055 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_124_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5bfd5f2489a86dc69eea2e2374aa4d72644b92a83c98dcfcdf06741dedfe45a8 +size 208732269 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0d913b61f68697be5e795b24a33fd6be8294298a --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ddfc68c41bd01e555d185963db21eacd4a04252a2245755b8d3cea6331e7947 +size 208731437 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6e6d656c8c947c991f9f2577adba9c1cffe8c830 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73496e54dd5e41f04218847e904b600df9c412f8ab588b38a9aabe9624322059 +size 208731437 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_125_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_125_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1e80b239b21e6645ae6d7d7f262c894faa43a7a0 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_125_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39db552cf9b73166e17a9da66170641d79be675c1ac7c959e4da2f8afcbeab06 +size 208732141 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_125_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_125_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..93b43805c85bfd419e95c03f8052f20455dbbe90 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_125_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f334d96916beb8042e9c19ed95e7ddfa6c4bb0592de8bbfdc3ae72a25513003d +size 208732141 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..54f4ed4f99685354e028185c57b69a8b3954e7ba --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:41faa88a9804b826344e509849c7be386f84fd1cc7b59f338e1c6e87f0443b15 +size 208731373 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..45b8edec42c09b3c34002cab94eec6a423f3345f --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02108c06c09292a05df749e03ede6aef0782745c43236cfb338680d1082d93ca +size 208731373 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_126_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_126_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..48828003c32c9526b4f60a06a82f9b7b07ff49af --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_126_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d05d598f13cda34b26c650a60cf5c89c9145483a5a75351ef83cdb01372a45db +size 208732141 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_126_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_126_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1cf5cd0538fafd185712e007b2913a5a586c4c0f --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_126_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:43955c65c9e62d6ea4e49e6431a4546f9dd233f7a730c284e0b2f9a8673d7689 +size 208732141 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..28de43dc5c74ff6be2913dcd2fbbbd2aeb53c3be --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c17112ce05ebd89d8490a4758930e264b8ed63b0eb39d533920f95ed91847071 +size 208731373 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..899fcd9e6dad9b40e29198b0b6e7c54662959101 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3be20266a257499ba351e71f342031a607c96c9ce1d2810341316556012c01d +size 208731373 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_127_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_127_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ea8b6c780e0301a7e5c3ae45a8c312f76afea438 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_127_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd431570e9885bfb4e9765b07b7bea312a1d3135a21ce3caf7503e307baf3747 +size 208732077 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_127_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_127_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..79d53ea17f2548062325bdfe64964851c0cae541 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_127_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:afa7765b2ed09e27e7eb6310b60ff4b398e641857542e6ddec284c73080d66a0 +size 208732077 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2e923a074f924f3ef42e9426a498467d2a25899b --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc5d06b498618ebee85a01fc839fd269642ff74f9be7f3b6e39ab2e8235d679c +size 208731554 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0b045c91fe81b3295e251d0b38cf66267ed33141 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:329181c20a21a0c575cf797244fea0b57997dfff7f4f4da54c6d196594cffb86 +size 208731554 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_12_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_12_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6f12cd341c190999f5d9a3c6e50442421afb4d02 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_12_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f02a0f9ba679fe7903b57eb8ba18a2d87fd73e6d369ae77e3d950827053f966e +size 208732322 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_12_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_12_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..04a5001ec2c4476b93a1fdf302a49db28fa341cd --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_12_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a8a2be32913384f321b3ce4c95fc619572469464f6396448152e8ff692b5d42 +size 208732322 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..510c6d4539251f4da07bbc41df06744e3d5ae966 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46df43da4dd835b64c341ab27d695ae7f9fb4813b26f5255c6a4fea42b39c6ae +size 208731362 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..199e779b5f14b95fb2ba596c54a6c2750837cae6 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d5308d0ee87f863ffc4509d8f158af22b76e6cf80f652ceb1bc9e196aed548e +size 208731362 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_13_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_13_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ba69fe08ae64d86e3e891c74f846dff0906563be --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_13_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a7f7c4712e6e5a4734e133558e84dc6de244f9912ec4d17b167517244b15be8d +size 208732130 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_13_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_13_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..950809b5f19ac5bf2289cff2b3b8de21db668e91 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_13_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:75aa7a2eec07a0c0f58d77edb0e06c3acb0a951cb2afd6d597fdb959692e1e5f +size 208732130 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8e6e11ff187fca3aaa674e53b4a0cce8284dc708 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90ab78d2075e352717ed03a3494659f97928670242d267797b08dacbd6d48c9f +size 208731362 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f56f096480c642fd4c7559053ddf7218861f7ab5 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb27308cabba1c1b4b549648a23867160de8b447279b4c1b38169a51afe64789 +size 208731362 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_14_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_14_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..207172c63767db45e2a16ee89974a94d77bb8150 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_14_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd2e3bc20e0dbf9f0845369eb591a86cc27270c3caeaa12195acd8b930119785 +size 208732194 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_14_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_14_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1241e7851c8043f7544f9b1e1bd9b1ea80c629b6 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_14_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3297df3844b80289e68995bd1d5280caac477526061b77aa503c607033408e64 +size 208732194 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b1cd567881a921db6b065266ae994e0a149a639b --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:43e1895cd00ef776e8e40e3fafafc15dc72e8bffd059d8d4e207e52354765985 +size 208731490 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d9a64f89126ce3822077a9f5087a5d888896f9bd --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3cd2e7fa30df7d1b2526f7d33391583464919b596b07f2bb72cb52477b12b7ac +size 208731490 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_15_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_15_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4a42cc36a1c025a5a81c32bd0c2dd43375154d0f --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_15_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a0ed238601c3fa033d7102fac1b4d93c70754f8475b05e2488bb09f58c612cc9 +size 208732194 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_15_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_15_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b15e745def0de07b9ca0737400414a32e41781e8 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_15_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a980e4a888819364ad501219ebaabc1fa1174e05b5676218fe7d824cbd7170f0 +size 208732194 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..369c419129cf2f8134ed750a766f82ecc4bfb93e --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e94c0a4fe61d707b822ab0c470067f3427bdec0ab3b9d5022a28bff34802b66b +size 208731426 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..49560c0663ccc5718c3ae3eb3d66ca441f2d24ba --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:99dfe7c26dfd4a7084dba7150d70cb4617d541d604ca34b0b502271d0b45c351 +size 208731426 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_16_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_16_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..22a70b3500d18a928fccc6935fe8f6df9a06ca0a --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_16_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ae8c159bff26ecbffcd4cbd8e33b2c22f8217b05dedd5529c98d4ebbd1d204b +size 208732258 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_16_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_16_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..382e6fbc5bf7ba79451d1344ec25e7bbc0a1adea --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_16_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b1ebe0af70de2abf52cb2449b5b2f16662d8c04f66ff96aa10ec218714d37c33 +size 208732258 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cb6ec5971a5cb3fd83785da05ffd57b5b30db621 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea189cecfe779b2912a337e04ca4dab7305df9bbf4dbb7b362c9a59478a25344 +size 208731298 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3f48b2b2995558a568443f8eb7df54adeb12c732 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2afe8302aab64edb6176864bed18709a8befdc8f9cf162b0a8320ec714844c03 +size 208731298 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_17_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_17_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c1db6d44edacc7cb8d8b35ea6a8108d1f72a9228 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_17_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51c017902f41b28d9ff90f11fbf3aca6eb19f44b4d05df1fc19db653efbc8087 +size 208732066 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_17_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_17_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9552863761f3c7637b7f25eaec6a4b522e66c264 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_17_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:901ed5a2af2ff07d00ddfa413079b16c675fae252d200125ae7962f4ea73fefd +size 208732066 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c5459524b46b745eec88e8a4f47e52c781ee6f7a --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d6beb01ceddb45d8ecda83578a1588a22b750c64887ef21da7095895563e6b8a +size 208731362 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..da064b6ea4fd643865632bba4dd16243f5d8a1d1 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cafee007b6198a79907d29b74058ecdfefc5ba7e08547480cdd3e72e6ea23ec1 +size 208731362 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_18_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_18_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1a35549dd3239b92791dc380501c45ff0a193d9a --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_18_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5bec2a6796584a9405ae640103c354778971a9322c27e06413ad225636673d26 +size 208732130 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_18_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_18_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6821316138f651efcd77b633ca9d2d4613327b24 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_18_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51db8266567bd63e164d512033955785e7f739a4e52e510c9d2bd21a5ee3a2a8 +size 208732130 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b07e227cd93fd5d34924a3461ade88d73e90c7d3 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:05575f6198f54919c4ea7b2f05b612c40f594f165ac28a6f058b172bfebb140c +size 208731362 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a2b608816aa186cac3a752f0e7be9d5198022c94 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b0315c5f506ceda2f29a9f8b324edfab872222bd5e705882cd1dbcbd6b752037 +size 208731362 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_19_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_19_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..667376017fb9ae22eec0f2d8f61a79cc74802bd1 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_19_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:978364a443b9a2c030a334c3d4b1aaeb376ec1fb4d66c6073b23cb2415c28315 +size 208732130 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_19_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_19_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f17a279810f43e8d359f4c17fbba99b276ee4db4 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_19_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a34bc11243bec821a325793fa06c9b99cd83a8636e79464efbfde0eb2609c4ff +size 208732130 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f0f5b204df9f09f633a720370d04421825172899 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9a4bb8f76f489ab783785f8f0add626c8a96d399cce326de819c1b75fb221c7 +size 208731351 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0b14a0ab24cc8218868087886bd7432cad8122e9 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b659f04f2f5e33c922f3de704e94783227b5b13b0e48e51a398e019604abfe00 +size 208731351 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_1_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_1_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bd88840e04f998d58d02141aea80d68cfab2774f --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_1_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b72b5755016c800b8db571f60464cb04b1db1ea8312666f894c3e33cfbb02f15 +size 208732119 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_1_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_1_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5c8526e996888d18d85e916d5ef195ace49aa19e --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_1_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a14f6336a9b34d77e4e841e4f454a234a2aa517f939ddb40f67d8bd3d325566 +size 208732119 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..044f2a36183db55260ea28249fbf9261df13993e --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a50ceeefbc7a228818e8f256435303407a8457815a7e9b0c16dc7817848392e +size 208731490 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6ab068f7c2258ca3e1469128d864e7af6058873f --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:45e39732795ea28ff0b46c293a998e2ae24510226bdad7936415aaa5cd526b8c +size 208731490 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_20_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_20_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..85b4aa01930d24133c4401d0b5e06602c33fe4be --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_20_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d5252ceea2aa0c42340e603c854c74b13a19fdd9c87384114015a69f8fd4f425 +size 208732322 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_20_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_20_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..af49a16b4b34e1a7994e41cf1a540d5050463bab --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_20_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:05f95ca04ae54745a0ea5f90da5773a95f52bd56f8818fc51fd79d40ef960f78 +size 208732322 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7c8dff56b954135d62718b895a4189d06de4bf5d --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad4e99710a25e84015cfa8b013d471c455cca4dcda21a6e5181cc536c1935e3c +size 208731426 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ce63a58264175c0753988a034477eb8be7767b49 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e1398c46d6d883dc3bf97f55cb3e795a7b88c724425953078361cbb0de9a0a66 +size 208731426 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_21_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_21_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..595a68d5af5b71e3b4ba412907ea0428d25b11a6 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_21_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c00d6b8410beb496a8cdec4ac7a23699039670e203980d24b798bcf347db4cc +size 208732130 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_21_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_21_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b697000e811ec9e20548cb030f281c8529d7087d --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_21_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd5fd746bc0c23b92eb2b2e5a2324bbb13bcc2e1fe02f01dc2c27b1a1d9b1182 +size 208732130 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0834fb5ecfdeee63cd169bede7698a3158e4db76 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb47e77dbb8dce5d92311a2cd3f6d2fc91cd493d0b3ce5c3989ad98520fa0e27 +size 208731362 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fbf893056357d9e021b0d40bc9ae9babf496e9e5 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e825d3b631711001e58b28dc0f283e1c48cb9a81bcced9ea308a625a39091a48 +size 208731362 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_22_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_22_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..803090d5d183ffc09356e2b235daf03172b24585 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_22_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:93863fa7b9379f68d402443f81811945965d176781116c32b11715c81bafe765 +size 208732130 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_22_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_22_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b6ed0456989930b495e839bc54f7533b51d55319 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_22_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ff150cf7b7e04ce38186a870bc798b087e48cf7e23bcc6eaceeb805c02b5d55 +size 208732130 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..95331659ca7abd062eb89d4bae6131c9dde69305 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4dfdd53984313201990145d3237ddbed4e384ed30849180eec9194289c0070bb +size 208731490 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5130fb85849c4eeffe7128c6ed904c7dc32be519 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b56cdef3336799dbf68930ddbd682ddf9239752a289e8150bbfe3103ecbbd412 +size 208731490 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_23_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_23_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..53f8857723bb148a52cae623438e6bb44e3da86b --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_23_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:12c98b6e7b1ca0f3da6a8ef21bf30737465bbdce5332dea5a49f49b8c9075686 +size 208732258 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_23_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_23_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5a942022329cd8775b3e67e89057d7b45475f514 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_23_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f8d78d109e44f2f4f12b123be4f6e38fd6eee192233d18e21fe637786044ad8 +size 208732258 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3fe4cc9167b9bcac0645a0c9287a735ec84205a0 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d145960539c48163e6f56bb25a7497b7d9b90f8c26406d6eb928f149269fc7a +size 208731426 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b4e36f5908dfdfc4dd8626c17a55d7c411edd84f --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:062c3d7c6896f66bcce3af0b7f58e7db1f78ee57777c6def0341ffd9b13fdbc4 +size 208731426 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_24_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_24_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f243f1874afa2d8f86c1384d98dbe7a0c2284e16 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_24_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:628e24149cd4ca8e6d0dbd0e9c67f8a50327b689cc7c6e7bbc909b6a795429e9 +size 208732194 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_24_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_24_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ea9652a5109f8f323ed332e607274f52d44af4ba --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_24_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e1124a95a117ca1aa496542c9df8c6fa12fc26fc81244dc47caf2f5132e734ad +size 208732194 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..60498127f91f3f0c2b36afa2755ebeaf274e4b93 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd3431e687dca9ba4b3e9ad78a09282c9a72885b4a0e45b1bb22feaef439ba20 +size 208731426 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8f3bae9fba9c4a1061e9c879ba1b71e7b28b0cca --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cfea9330dd3d04215153b4af1cee5eff5d304c0a3dc548666ac14a3c49396ea3 +size 208731426 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_25_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_25_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..193780fa137880c878bf6cef6069749158ac9885 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_25_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:72cf97eb0e32c86297458552580718d994ed528ce1f0531bf00cec02b7dcd040 +size 208732130 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_25_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_25_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..22fc0f231a0c7e8b75795ea61ab877764f939ec3 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_25_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb27236599a76d2ec783ba2a697e3fc5822458302ada5c8d528df3f3f6558668 +size 208732130 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5ef6ae21c99ac1be8dc440f11adec36895a1d170 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb58138f0488142e35ce71c976445868546e2e849550688e6d51f728541db3f4 +size 208731426 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a0e9752f4c820a571dd4f8abc394c9065086a744 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d13f811feafbb271349509290e91deb6f1c05ac8aeefdd85adcf9540d45032f +size 208731426 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_26_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_26_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6304e76c3f494160fa15289df7f6b9bb57d99457 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_26_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8abebbae7ccbddaad94b5494210c7af21ea2e2ffb71ab335314d4f2a33f3c793 +size 208732258 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_26_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_26_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8fb18f74242c1588ac73ce50c4e600baa0de6ea1 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_26_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90b3e030cccfa83481cefe166d7ee26f18cf1021409003f4fcf3b949214f3daf +size 208732258 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a63b3e04b7e3211eeb6edbe7e773e0aa0bf36387 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:203d8b6d9a8be922c4d03e59db231b698c7a2e2179b0a44ac87a672e99c6044c +size 208731490 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8af483140181e7cc33e47c6488f9e153bbac9bed --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:83d1f7ab9ee829ace7a134d4c07240ee3078c3a034a7124ee50e7e47efa09298 +size 208731490 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_27_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_27_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..def7d4972ae596411c97e59cc061a4d5f2fdab3e --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_27_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2594c9283a5f489ccc26d8de0b6ccc9bbb0fc22b4748a305dfe2a122850be758 +size 208732194 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_27_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_27_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c3368876d2b111317ee3a7da731f6375bcf8bdf1 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_27_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea8160d859cdded56235d535b49d83c5cc671ae2ec1afa9cf2e89329bc68ba70 +size 208732194 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..59137a5075b181e994c10d6de5137c27c6d396b9 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d6bd3894b3f85977837d9b63e0a1cf07e19ca8970a3c179ccbf7b169574eb4c +size 208731362 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b62384c9e4bb3fc33babd10fe6a5036252200814 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc1f5fc61412ea733eebf7247cd01fd8f51c27d426177db424ca752b0242ae61 +size 208731362 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_28_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_28_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3bea6e7a470b37a6d94fcee5c87d0fe557576ea8 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_28_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20a886236748291ac23508e8c59757479835b41afdb7dae96a425c4af309bc57 +size 208732194 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_28_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_28_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0decbf4e39b06ad7b03d215e789c72ab3b5ef8e6 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_28_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e54258625d1c92de43e8f1a45aa9ada9d277a556ba26b22aecd5bb248d6c95b7 +size 208732194 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a1780c7e21fc81ec7b7e440e1a58957c17521788 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:839c0d83371d1e75c1214c20cc8b22fa1d014a4c329986d50e5bcd623d20b9e7 +size 208731298 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..40ac9d43d489b616b95fdcbedbbb6d926c241235 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e98101874009f7fa53dbe14d4003bafb64fffe62ef354ec53af503e1f8617665 +size 208731298 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_29_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_29_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d7b59dec2e9f29affffd4ad4f7e10e96e10c82dd --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_29_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd8d02eafbc1b681b7721585a5ac0f620277f9216c79b03de3190369975c8ba9 +size 208732066 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_29_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_29_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..913afc48a96132ee89c72c7c729580f18b061823 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_29_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:469fc3b9a2d246883175bd21d2314d052813b694607c61c81279e199c66d974c +size 208732066 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c96595e22ebcc5e72e052fd138bf0bf1129df7c5 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7b7877d19b9e9857e7ea44b238510629b5d84618831dff2904de95b38b7802f +size 208731415 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..42efd828adca38c8c2673357e08150cf169bca87 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e0d648074bbf3ff37d52cf70dee5e2627825015506c241473152955e1644ef97 +size 208731415 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_2_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_2_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d1e4a918e5ae8ecde09740fddd2a74a2d351ace6 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_2_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ae16012e69360873a18838bebcc753d9300e1d5fb7fca7ccfc14ad0b48cf01c +size 208732183 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_2_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_2_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cf5a3b54c9a5497ee9608b0880818432bdd85ad6 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_2_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c67f76c3de0aa43727ba1bc0a5420515c3ebbc267482c82265cb5ab2de3af66 +size 208732183 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2f930d0072ff6a3e39f218b461a23eff14697d96 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0cc9e52b53211737ea00ec4a38c2a7599b73b5e9a2d4f7ebd1d116d1e8afb036 +size 208731298 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d36d60066eb3692f33de2fbf915c314e61895082 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6815427b42c2d69427038c80d2ac77d1d1fd3c4f1ddb043d6f67dddee40d9d99 +size 208731298 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_30_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_30_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..eaeb79a17c15bc5d123efade540d1c8457108211 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_30_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd7dfb89cb7e98d48fa5b1d613e2162d53cac2c93c9bd196c72c4266dc583ec6 +size 208732130 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_30_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_30_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e61c94cdd4e53770ea05d9a9eb70f56bee49ed7e --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_30_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:321de70b186a51a3ae140e27a1b52ee12f1858fc11ccd0f98de0382ff90cab19 +size 208732130 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..35c57c8583e63219f10bb60807a65d00bfa65844 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e23b1b329caf7ff75fd376e14a58b839078e1c48a8960b82022a928d6be7ef20 +size 208731426 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a8841810c97e5a3da8f460d391d4f4e1360b020d --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:13d3b61550f9adc56835aaa6d0fb710649f9894f6616cd333dab3d41c4a214e4 +size 208731426 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_31_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_31_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ce60965f2d0d6a2939521c296b695d8955db6685 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_31_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23f19a67f71b8ac46652f69fbc350f760fc8bc7fb7b8a72c12d36ba4b68333ec +size 208732194 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_31_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_31_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8ecfce3f6849bd60e101b6a428986b4a924636ec --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_31_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:19d8655ab322800aae6004f6aa8b1059fc758d63ba2c2b9fa01fc6d73023e45e +size 208732194 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..30f774101495d15ff617aa326b4638e7915d00da --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c371326983e6456c62ba57ee85d2d205591f906953724ebe56c80f2eb7e6ec94 +size 208731426 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..01682fa2ea736b3ae6cd6965cf44e519b1be426c --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:94724e9088c783540ad8027b85e4c9851ec24fcf34d36ca3cf66d6dc87df9200 +size 208731426 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_32_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_32_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0d10978945e6c26cd7c8e05ff1863f5304186618 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_32_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b0e4e692de7538fb0cb404c1f6afddafd72a9ae817660eaf2941bd81f0527259 +size 208732194 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_32_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_32_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..025953dff2867deeee57aadaabdcd33a2558ad8d --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_32_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c37e848ff8b91bacc2257ec280c788549ff3b200be25209ae2866c7d6161e62f +size 208732194 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..20750f29cf8e56c4e575dd140a3d4ea0deb06284 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6a35673ff69e514479afb03e15edcf32948cc57558a9af7a29b3083e3c754813 +size 208731362 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3e1035df168b5a629bbe5ff796606d4f864bbcc3 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b5f57880f83f0a26bace1626eb5ca51a3f883cc994b7a3ac0ca904fb48614ea1 +size 208731362 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_33_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_33_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b7468cfae40c37d290959bafec7c11168fcd3fcb --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_33_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:814863c9fe72657dc3e8539b3d3be06e8f568bd127fcfee9aa5445b9001f8278 +size 208732194 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_33_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_33_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c54f81f349f425a4bafc6188ae896d6ae21a4319 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_33_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c37789e40289c32eeeb8a3ac0ce2b7c3da7db752ee95016686aee08588d8e43 +size 208732194 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..50e79c3d65cdab0b92bfc9638a0b9d902e055a80 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:40f78c16f72527d73c2002ccf7a9c387ee0934d677d28d0f544a7be210341e2b +size 208731426 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..be4b16a3ef39c33dc6d580f0490719c164211650 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0722138a2bdd8704990466044f15e5fc3d2a713920aa9483e1d177ccf7bf1d41 +size 208731426 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_34_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_34_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4ae3de5046ae871a85b21eed2a933531cf649b9a --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_34_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1984c761619e83d215de465d2b9edf934abf2e9f7aec5abb90673b151c6bc42 +size 208732130 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_34_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_34_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2ac56e2358e02d9908bf31e1e2ca0151fe7c02f3 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_34_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc36e4d8c698e7e2b84ca2e3a41bc04d6b72f05faead116aeb13596f7a811c80 +size 208732130 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1bb53c5781eae1e2c1c722d67214ba8afd024a55 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ecec6e20427ff643a1df8f021fe0f1f1484597e83cbcccb8d7572c58605914e7 +size 208731490 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..051444254ad552a5db6bd8b5efb6aadda1b262be --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02d29b6ed200e7747396e0582d2679a24c0a58b20814a33f6785f6eca4fc6f90 +size 208731490 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_35_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_35_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a1ab4b40e4a79f785041aacf2aaedec5a19225ff --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_35_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a8661715d5728969c5c03e6b4caf48023b2a25cc8ddbbbff3555f8e21c5d170 +size 208732258 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_35_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_35_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..12847642cada73e66dcea4f35f53c1a26230d044 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_35_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:18ed3538eb163938b6bafa38e3c512bd5284d6b42f06de00be7fb92e851a49cf +size 208732258 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1a55440bcfb34b6cccf6242368dbb48bd0e0c4dd --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0602e46a29cf70796bfc34ff5d39accf793597203474d5f96e84c2533a35a2c8 +size 208731426 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e814b33582ffde0f1a00375d15795887f0746029 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:941ce6e80416a13921defb67774368bab4b0c1a0713e37121f034d16fa82913a +size 208731426 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_36_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_36_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..85afcb98aae187c35068b398a8412e74f686ff6e --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_36_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d8bb79f8317250f882865fafda9621b9f057aa3abac908b06d49ed99b5ee796f +size 208732194 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_36_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_36_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..73e95a6e0ab25cda045183760407ee9053a723c0 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_36_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3eba99951965a97bee3be796ea2fb6e90ccbb6d9df71e9b96e92726bba4cacf2 +size 208732194 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..944c0dcece5cbbaf479eb7ea1d09c25071533b16 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c43f72e56d045d352bd3ab59ab4bf3e154902016dfe682ec11a30bc18ee35ef5 +size 208731490 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8b013808e343a09477c76d606b5b8483ec71ceda --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:916afdc4de62467bb2b78a615b434119ee4a74e05486311d874ce91feb4b85ae +size 208731490 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_37_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_37_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..679f6d1624b9b75ff89c9f7d92953331657f6b26 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_37_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:706c5201beaa91ddcb90b3c857099fd060ce114c6960c1cc71107cfaeaaad193 +size 208732194 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_37_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_37_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..50041a0e62da12ca6fc55e1ee318a9b0a5653c16 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_37_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea4a97bb364755c71cdef038ecf2c03a33fcdbc13e7fb154f99773edd8b6717d +size 208732194 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e49a2f41e9f87886a68b41c4863984873025a6da --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:53451f24eb6f5cb4d93aa080de4536e1140ca56d307deb827ab65c47a227511f +size 208731426 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bf3ea2ae8e805cdd3f0b47954c04c1ccb684e964 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:583631b92da2cd0a8b25d07970730b730582929caa9b03317a8ab9458f68d3aa +size 208731426 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_38_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_38_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..19be155451252b168aeb8faf45b61b354ef84df5 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_38_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6bf5256d0a0c5dee05505e4e38ffee68badbbea07fcc50aa5ec3ed0607b4a58a +size 208732194 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_38_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_38_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cc8a49c56e3c32515de8081de509fddebb6db557 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_38_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb8870041e3d3907120b2de3954a39d620cff6ece0022a4098438abbe50293c3 +size 208732194 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1e1cde8ee7a7ed8ac50fb309facdd327b64c2018 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d6e4fe2f5de95e104ba23a8359597a1fe81acdeb40c90056e8ffb8af7cfb2f41 +size 208731362 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ec4e748b4793abe240348567eca2102af843fb0b --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:36aa495499e451e4a9cdd33f0d277d3565836750be3312f02134656bedc58911 +size 208731362 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_39_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_39_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d155b322721a670e679f8b7f35806adf75ca3ad5 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_39_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f9ce1a162390280ec41dd11bf750209df4aebdebd78b27926001fd01aee3aeb3 +size 208732194 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_39_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_39_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0e8c76424e011fefd4a54d8169d99c77934715fc --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_39_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:abb61855a35e51a9529c470a1c8b6184dc5647ce73be99f78c7437b144c8b1e5 +size 208732194 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d5f2319767e594c86ecb63ce00a4993e2da22671 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a5d3cbfdaaeb30071e5c31ffea67a0fa0711990aafa5e8e320c96c9b9905483 +size 208731351 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..76f9f417661b6b65c037d589349b3983ab464366 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:311085b91fb18b1948d44d2f9b999c923a87e1bfc04a12c88488e5cf176e562d +size 208731351 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_3_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_3_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d1f001da13b60a89503be21203347744d385a6bf --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_3_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:26904b36858de09808922fd226503ffe2d0029b699d5ac51d392ee3182c9f577 +size 208732119 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_3_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_3_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..70764dc1481abafae014421a2f413611ac6407d3 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_3_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b8f0333f62ce9d4f52ce8d7070e7fb71416b228ee59c17b3d85e59305867a53 +size 208732119 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..271a8662fe0de232eb11c0c3c0cf95d36764562f --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d05f8abe315ba7cfca4b8e2cc47aa556189ae452273177ec34cb189046906c9 +size 208731426 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2087411ab700f41d508c4314b8738d6c663cd175 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:49acc31ecf2d39dfff06172641062e7ce099e08921a4be143660093863500c5a +size 208731426 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_40_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_40_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ff02fea547c2146378943476cf9bd1c5ac93545e --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_40_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d99527249e841426c192cc1ac2486b3b9f580a1b625ab181c46158f80f12c8be +size 208732194 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_40_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_40_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3c3d7a33602debebdffcf6aa73cb9d18b57b0be2 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_40_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af9c65602e6ebed6922a9a5d751a6e47c6b96bf3c7da9adfe20fb5d64519de30 +size 208732194 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d6341a35b021e324569de580478d0f744d75c29e --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c6b94a05de00779176af6fd6b4c514ef4ea644e63c15be7a45950b18310248e +size 208731298 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..afd317c755756c06d6bc3f7a1ea28602cf803698 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1717616f2b03a82a8f0cacf8086661d4f85e90bfa0497dadc7603b420caf0400 +size 208731298 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_41_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_41_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..de958a27da724786ae409192d68a528a49f2f3d3 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_41_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:014ccb1b41a948625f27537ba6d75df4d3f145b2b831d1df7e0c59e83ac645e5 +size 208732066 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_41_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_41_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..726265995a6f5daeac79f5bb00008f030304e153 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_41_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:63232c735239c9e5a4055af0b8723215672c76a1235eb0d9ffc5f37b781827d0 +size 208732066 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..16664f7f234e768c110b2d6ea42408be48c8bf01 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d69cbd31693b623863630400b3394f7a72546b80f56f4c14fb8b7a8459d71121 +size 208731426 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f4cf0069d865d07912e07cb36538a874b59072e6 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ce89ac12577283321225030fa17f1786e03c13c87af29abd5fcf2c5f11ea291 +size 208731426 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_42_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_42_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d4c863b0f6a6e8e6c663ffc21138c02c9cf5fcd1 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_42_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9287223121a045a71f242595b9f189f7af8914b7fbabaad029d49c7442638e72 +size 208732194 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_42_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_42_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f8155bd8b50524c89586fdd3dd040d08eaccb39d --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_42_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3518a70a00bf5e6c63e815b28984793065493b417b9b88fa94e8ed02c9fafed8 +size 208732194 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9f619ca1d902ede906639292ab18467ad2c958f9 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b59f5e1532f747a457daaf60a807310de19724800a5b7d19b835c1266d4d962c +size 208731362 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d94ddd16493a63826b172d333aba9ac1c49157bb --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:07cabe575ee3f511902de3a6b905659d50186b769d2144a48dd7ad9b1f9e9162 +size 208731362 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_43_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_43_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..634bf96e1d5f956cfec42f116ab57f1135b7831a --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_43_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:762606ffc2b0213da3846eda7d8eb50f66ae7b9dd2977fecdb1d1907453fb856 +size 208732130 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_43_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_43_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7a3095fb07625cf974e0f34526018dd6d75bc48f --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_43_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d1176898bbacdc460c67f90b6df08881e888854312e6aa12c8d4cd404680d96a +size 208732130 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..82f35133f0af873a1e17f636ac4187dad9658e6f --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20b08ce6da12042ac2bdf17b0fd19eff74aab8177e5bb9144e719157081a33f4 +size 208731426 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7c745e8783c46a5d0b34a1b2ca3d43290a45aa60 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a00db79ea684ff1b5fc770bece1a652f7dae35b8af863616dd97670a65a89d50 +size 208731426 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_44_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_44_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..45dadf4d8f25c4d941246b083f21e2854c477bcd --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_44_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:71298d22fe2f40d18996c9cbcd7e4823544b39c3e7ce2b5fa839bcd20fd34310 +size 208732194 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_44_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_44_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a2b18e2690d8fa0f01ee19d5b588c7c326e068dd --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_44_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6a2c5d7bafbba160b9bfec29357218d219eaee69d413520c6d974a3090a747d9 +size 208732194 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3a6c270bd3445bd4846f33d044bf2081a2d26dea --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:643c58ee389d9582c6d3afe40be174aa000a8042bf302825cf0efe7c28c9fea3 +size 208731362 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7ee2c8feb4930e105480a5cfc86ea45dd9068eb3 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a00160c9ffe61ce51335488ced39216fd935fae31d3b5e7ddd9730560ef7bbed +size 208731362 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_45_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_45_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..67b4800bfc37ba210e61c8f9e5c1a6f47ee25426 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_45_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:11d45524656d8ec3a4274646ac92d88b7013a6ae2ebaa9419dcedfd813c661de +size 208732194 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_45_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_45_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..838c3f31b9f3d331c9a76052e74590f84416608a --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_45_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90246509508c10055149a3f9f1ad450b0edaa6abfdaefd695f8c92e2aa79bb8c +size 208732194 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..69e97003b9926e801ddfaf2134d17b96ccb49f75 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:55fb30b46d5dca34ab5145c48c0186d60bcdb95f12be4a84730a66cc6c3c4796 +size 208731490 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1dcaa617912ecdcf064c933e1aea49feee1bcdda --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:40fb35a57008905e67c850ba4279c95917a132834c59fcea9c045961de708163 +size 208731490 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_46_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_46_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..12e1063fb0c2483f4ae4e49e5dafa8027d697030 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_46_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92d99a2a02aebab6c2d965141b2d81ea30334f864bc4ce01974a28ebedc5f45e +size 208732194 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_46_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_46_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2581f02c3c6fae19a2d105faf4163feb49478160 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_46_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc94998e760378f2910a9bee4ee494b1f561fe905dceed9551ef254d465b0d02 +size 208732194 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fbb066e2b3da93b0824ad32a43f76276a1c0d059 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:03dc48b24c5abb2c333882052a284af85b1ad43eb282f622b8d4ef7c43c35a93 +size 208731362 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..be3cbd4f9c14a697f4b222f6fcf23d9390429afa --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6989f1748bc61e30e005f8b31b5dfe404f05e5af94d7bdf730b362c3570ecd03 +size 208731362 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_47_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_47_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a2ffbb697d029ed8ac0a7b620135e34a637db8ba --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_47_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae748cdec75a4e4159ea0711f355175aa1d725c81250955c44c79feb729c991a +size 208732194 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_47_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_47_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8b127a219dc5e54ccd12e67e9fbc4f1778f6d96f --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_47_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1656e7a1b2dc08a80a6d51ecd18f5f25ecaec7f169e457f579890ebafcb1ee1f +size 208732194 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a4cca0376940ab066f589c413eb91913dc3fde4c --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f742019b75bfab3a774999359030f717d4f8e148808c1b84fe5609f92db0e644 +size 208731426 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3768c35b152818248381f56786288608fb9da447 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:17ea8ada7ae54b3f8a18f8f47dd583dc25036c7c20d506224118d472e0e1f39b +size 208731426 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_48_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_48_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..38dc17be030bebd4bc2dbec264050e00eb7821f4 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_48_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:26573d8eec9cb19bb0904e9dc5157cc26e659babf242294218af6848c154e5d2 +size 208732194 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_48_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_48_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..50b3e4cfecd5c9d1344f85c7048f0bb554fc47ad --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_48_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a22a14cf241b94a7fa9a1cec6328e5cff2fb170eb6691a7478664abe4e89e12d +size 208732194 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7edc12d5c8b7c3bd0fa27266de098b1e40aa37b8 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc81360d887f415c7d319e0eea8f0cf589d9513238f73a69b8069304b3b7917f +size 208731426 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0d5161bd9337c1375aece67ee9aa596321b4466c --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b081374884874a870cb90720f90e8eb5ade0b05a627a6803d9786ac74824c953 +size 208731426 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_49_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_49_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a876f0f02900a5d4d6afce0286516f31853a35e6 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_49_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca076768f17d10092cac67cbf7ec0e2d13548122fce774750b34f1080220fbd1 +size 208732194 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_49_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_49_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ce0461a32504d1aa82a8afd5b72bb87f02a4c4f2 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_49_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea93967f9a6a0fcb5d43929144cca0898214ff9291406a759b2c833db09efa9c +size 208732194 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0005636344f1b1173f33a9c1c0e2cd68148cd99e --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e5b3b374f9b6b6aa4268faf83733d38a6fe398544348be3e5039614c54f28c61 +size 208731415 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fac06a7d4723f86ccf51d89b1c4c1ed1a53b233e --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a3a4ce879936bdcb03e49e53d636ff6b05742412823de97ec0cf5602d5c0f4a +size 208731415 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_4_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_4_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9888778599eac4315372f306214d3da1fd0d8d84 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_4_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d89d4b588b02c36e6e8562c131662f221548e25817986d7e43aada5f40334823 +size 208732183 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_4_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_4_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..57dded04563a01c8cfb7f7a37d0ccd1b3cc435ab --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_4_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a04302d73dd746c7b6b4f06cd08e6f6f18c4336af128f9160c155e95aab22f21 +size 208732183 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d1c75cb2e4c1c90c51563779521d7b9df244d9a6 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:57bb49d8ff95180dd549168bbd13f3928dee5afb7b5668da79b2879f8a568f40 +size 208731426 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..05bba80b1417353b2e95a1528e84539552a0bb81 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:058274dfe3f8225c98cbc2635e3675f6fb024a9136b266a7c308b39bc4bc0076 +size 208731426 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_50_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_50_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7f7b361bac990e97f001a36611059bc858cfc8d3 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_50_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1894f60d1c23e7c210e07042ab101ca7521b2726311fa5f264eda1b17775fd5a +size 208732194 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_50_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_50_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..325511131cb6b60f279c531fbd7705ef0ec19828 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_50_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d27c3361c44b2ed0b2cfd4bc0c8d350f986230d288d739e9d575c3dd0bc4569d +size 208732194 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a437c762be012cafcfebab88992272f027a5e48b --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b2cd3133ac66cd83f4420e4f73484521f5386b40f1367030d66f3621bedfff6 +size 208731426 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..36e86dc756c92f36e7e87cf02152c15f0e3669ca --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ed75a881350b35f233313a5555db2b00dd901d3aee5619fba1126a3aa0f17b0 +size 208731426 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_51_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_51_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5d8595de8f3e307c08924ec6a93a08b573f37c3d --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_51_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:49dd4d5b237a47c5f9ea1df1062ba7b51da935e52b910a3135dbd305bfd85815 +size 208732194 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_51_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_51_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f8ba34ace4e27314ffdd659ebcb80f354ef0cdcd --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_51_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d5f2cb8088b8aed0aeab551693aaf70f85771a74da4faafd8b2f3220cd8210af +size 208732194 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0f1da49dd817de2f6e29174c0edf12746b346927 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e3e754b8dde5eea5074d09b2fa26cba7bcc7ec4c2fffebb499e56657f424a45 +size 208731426 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..54d65b078e3f518f0b27e62e60fdbeabc67e9509 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8432752e43d75315f5ec16a22c45db89a0b2e9825c7f23fd182ba2b1202a7516 +size 208731426 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_52_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_52_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a260a9206f3818c413ee1a2001592557fc244e75 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_52_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af4402bf1041d0f5b9b86e7219059699c6fc088de6a5f543bb9dc5d060054fc0 +size 208732194 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_52_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_52_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7ede12cb77f369cf56e5fe478c8fbd8bae7a97fe --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_52_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e85e3f3888cd27fc5571efb519644e8b8621e64f6ce68cba77f3423598c9bdc +size 208732194 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d5d5dfd1bf1ae300e6eb89bc457953c22a00ea3f --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c7abd8a9c125f364616ca5a639f1b3cecc15c1e5b5c64ffc6ea10cb7a1bdfa0 +size 208731362 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e186eaa671f2a97d1b5b1baa8d93cfa51aaf57dc --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b5178a65e04a8f67d97d3e6614f3d267ad4032b1185d80b26fa81286f723d06 +size 208731362 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_53_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_53_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..191235158d68cd0c93d7a1504d3662d4af3dae30 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_53_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1eafb1bf18b28c3028af4ed3d810c5c06fb45d8b6f13f77f43e3ac6ce5d0758 +size 208732130 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_53_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_53_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..778e34cfe4f8253dce6b0cc16f391739d1d34dbd --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_53_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08462b9ee95793ff3aa2e2b7838d8251d9f76e55fee77a0d7833eb47d5585b10 +size 208732130 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5b8c73b67dd612a25c7b57c7963a0ca689b67b49 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f1fdb2ae686f9b257ce04864e3321e7cfa4c0559ae5d3695a50bdb3ce48b5cd8 +size 208731362 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e5b7adace5a90fe5768de049eac8c2f1a494f0f9 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a113fdfc6e3e6c8513d9053597c069a1c24a88165205b4e83e90254191354af +size 208731362 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_54_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_54_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..69c19a24e2d4cdbe5dc7a3e38ff01aa797e58b53 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_54_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fefd6178313cf5fbf98e52a9d865d4be53d1d81251bffd6d3daa7110f45c94e6 +size 208732130 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_54_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_54_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9c0e460afd9a0c50c0deb272c86b5a7707a43de0 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_54_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f3b6276b3ceef068dc7da12822b721f35553009bdf3617752284c6fbd2a6b869 +size 208732130 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..615525795bf98336540a2b7b118afd090f1cc62e --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f3c0c8012cca56c7bed99ef9b05a846db1c69f9d5bd93e2fbb4ef725b562dcc9 +size 208731298 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..51064cf34e42788f3d9b4379351a78b09290d04f --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a8a08aea3eb3299b58bb13a71413f226686270450c4128335461bed758aacf2 +size 208731298 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_55_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_55_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1b736752add50d5780b33be3ac9f9e16921eb7fc --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_55_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d33de7581075084f27e68a8a399ab42714044cdef36942d9f59c409f20c6f425 +size 208732130 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_55_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_55_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..39836b4cabdfec2ed0b4d63973dfbfcd0dbd20ae --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_55_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ed13a443070ddca047455e4a317ebe4a0ecd41836b288cfdc4942595062fa8f +size 208732130 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b3939190ea6f63832cf6ee0fd57f9ba16a92eca4 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd72df5d1370487812e41b216e20819795393ead54af33a9ede23c90d496be05 +size 208731426 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..420e5fda37f7f2734bf2be9d3b9c3b93419579d0 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d03b588210fcf3a441d88672b0cbb3ea3189ec4368501db7a02ff578ac9106b1 +size 208731426 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_56_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_56_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0da296b35b59628e44c3b2759062187e2a31fbaa --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_56_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:192088d15c08ee6a5cf0af824149033d8b0bfc91e8fd596b4bc80ea60113f4dd +size 208732194 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_56_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_56_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f5074e6b2130e16065c0b57264d88783ae7890bb --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_56_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6137190088e94e272236ca21e611e5abe5b43a913dc5d5ec8c2cd1fed4193cfb +size 208732194 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e5848cef796b6f308f7af50e23ff6bf54d8ac29d --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:54b039968a29b84cf6cc4e6719db30c33cbc5c7587dd5e47b1b97b1959eec849 +size 208731490 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..de93637bf91b7bcd9ad201331e27189bf9df83ae --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ac962d45a5efb7a824c232445c72a664454ccec3f97301b5bc7eb4815549bb7 +size 208731490 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_57_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_57_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d67bd4529188fd5db2546485d17a2b0d325cd8c4 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_57_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:87d2ad34c47aee76ce5220f89fbd2a3eea8f609f63dcc0959f1fda474e7f02b8 +size 208732258 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_57_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_57_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..eba573f44a1054ac727be9bb75eafc6b8825e3a5 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_57_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc286dc8215839e7aebfc702f3adaf55110026e4d229580a6c363798718b2daa +size 208732258 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..710cf8c7f2e2b6a3e1a2a48423ffd4de1685db4b --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea079aad3ac7bf0a4f5ddbc30f7cd10f029c1519e1c23b663b9b5c3ec01949ab +size 208731362 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4eae8afeea92a3d2f6a70a754e73bdabc992e3b3 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3889cee584dec942b82cd8f50cea94b6bd7324d086027a7555a984fe784be11f +size 208731362 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_58_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_58_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6a4f83beb02abe675a145735d316e2a64cb1299b --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_58_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:00773cedc84c413c108a37fe1d28f712849479d43296cfcb0e67cb266509b2fd +size 208732130 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_58_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_58_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5ca7f9e6ba31f48234d7809f939460910cd49bba --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_58_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:578446497090ee208da2dfcf3b83b95d63960521ebb3f8d53ff2aed6434b4be4 +size 208732130 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ba396fb40c30474fa57a3f6eb354ba803b3f3cfe --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:00d638694ef3cc89a2be3e2cdb6062b0b64f3e122ec87fce3889cbd51d477bdd +size 208731426 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6efe497614aa395b6e428a5f182fb94a15b0319f --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:45beaef5892e6a76032e293bcbeb541f0db6af1ebd832d6c2b3c2e6a194c5384 +size 208731426 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_59_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_59_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..00e211c5f212ff95d1902c731910b8fc8c9a2057 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_59_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:72c7a31e44fb753ec9f21fe9390deb0770dd986de37937fcd763aa7e994f3a6c +size 208732194 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_59_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_59_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d06287eef486522c5aae74b079ae0ac0855c23eb --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_59_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce6de9150b278eb87c94ff8e819e4087a3adfad61364d8a50783a080e953d25b +size 208732194 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..891185d1613b8d424ca0ccded3aa6ff325c6ccf6 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c8575adb4b5ba1b1cc2fa4fb4772e57c994a1d0bfeb283530c56c75e9528f84 +size 208731351 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dd982e299d913341c7bfea54f80fe95ae67a359e --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c714eca39ccc36aa323793026b3ff129f021806f1500ab5f777349a7353872bd +size 208731351 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_5_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_5_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6a771242e3c79d5062d1c9f3cee5807980d65874 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_5_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fba66eac6e5cdf32e78b283524fe405d61f0f1b0e843c7d2015a6af155b11642 +size 208732119 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_5_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_5_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3121b0d931c4841e832fc96e1448f7b151651f36 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_5_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e93c2f26b18e4fa2df7672abcc03da7cec5c45f0ac14cb151e3d1e2fd0fcd977 +size 208732119 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4befa6641c2f4b510705f156f177c41a1a4d6073 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:432b8147a9304ffc7ee1d05e72360638c005752235b35690b8e0223290dd2758 +size 208731490 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..137ec692230aacfad6591ca0851878087d7931d6 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd2c5d6c31e6c27d463806e733756e13e24859e31fc1e1778adda625663ec6ba +size 208731490 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_60_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_60_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8222cf6721bdb785348caf8b5dbe7459c2b3f5d4 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_60_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:483c80e573971011c5249e30f58e784ac50f9bf38e34faaa79a1afae48255014 +size 208732258 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_60_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_60_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e2d5edf4d4984ae79fe504f8bc3a80bf72f77a0e --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_60_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:990d071c7fb7bcbb90182a5e9b41b5f11607c8a2575716c76a28d49537529d30 +size 208732258 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..146c7780988f535415fb7604a2a98a19d7182f32 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:438534501c82f5300bc6898ff57aa3d068b154c64545f89470aadf8aa32a7dfd +size 208731362 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5786e6dbb62a5538a6142525401312bf4a1c0de4 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23e3db429a45cd07d277c399eaa4e9ab9c5f641c88fbe22c1b50f13f703909d1 +size 208731362 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_61_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_61_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f2c7ecb6fc99258db3e16778fb0cb41d3bfb7fac --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_61_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d11bb420e645919118ffae06b8c44ccbef902997db7fc517853b4bb18530333c +size 208732194 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_61_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_61_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e5593c206575952e2ab4da8a195486c109ce77e3 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_61_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff27e521d046116349e433ca3e9f335ad00fe5b218d7abbb0b2ff72c4c4dc7eb +size 208732194 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..50cb0e4412cc981a70bb6608a7cfcdd8c8051072 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b70beed68da7deaa4a7111ece095678eca5be6dd94ed14805b6daf688a75166 +size 208731362 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..111f0d695289f40b268e2a034ebab0fb33a0637b --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e6301f5e52004c407f1ade53fd9cd3c39bc1f8b8b10db1b0dcf1729beb031ab +size 208731362 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_62_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_62_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..852c11acc5f4c8366182339f4c67ca74a2c94ab1 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_62_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2917077cae875ec51515fa0eab9f37ed16a7b13c192ae1859d100b071f28a82a +size 208732130 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_62_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_62_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..16316f6f26b2c45b32376b2f5d3f82c512624986 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_62_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7273d1a2749e358cecf83c39d992095497d164433415bd51f0b8a386e17ec702 +size 208732130 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..db1fd15cb9771c386b3bca4df2b4fc797e9938b8 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8c22d64e82128c4843b75a6c6ae03469665f21cac41761765f7a9f9c19f913c +size 208731426 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ac18d974ff9a5219b87cd92238ed57fad3ac4bd6 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0df728997003a27cf94d53770cdcce0e778f2dd2942850f83dd9c566833c4479 +size 208731426 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_63_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_63_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ffa795a9783681ea848313bd1a5ff3e246627858 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_63_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1bc4a6be18872c1e1aa2ad89a9ec3a323ea8e6cb041061f16cfa2eb23df74fa7 +size 208732194 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_63_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_63_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a77d91dbed32ceea094dd2316bba08354a6b6e7b --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_63_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:99746ba750ae62f3f269d87bfde5add918b347ba807b60ab8fb217c53efb6629 +size 208732194 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..63fc9017af56fc51f3fae0def5f846e13367bf2e --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:56e1dd45119d3799b0e41a8ee489e5e46778d62c55d1b808da095650c340b19c +size 208731426 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8c8ce76bb9d252ce08bae30c9567627c6a4252f4 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:37dc77a8bfbf6b410bc7e3f254d6472722d5db5dc75ae74e1f9c0200dc298675 +size 208731426 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_64_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_64_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..39553d9ac1e975880ea37a30bf0f9373f78d0c62 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_64_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f5683041734e7e8e09eec610404d8ffcfc06df06e445d285cac0dc4ced5d6c78 +size 208732194 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_64_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_64_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9c7ea9ddb63bbaee273d262188fa408d311adf27 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_64_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ad2363862b45f06704eb4f178c1037bd32947c295a5a363c32b2d07d5811f29 +size 208732194 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..00d5ac849bdbc1a18fcdc70bd1be08bb63f77850 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b3156966c0d3bdac6fa809ab266aadaa8c9c0b734c95e0c65389becb6cae930 +size 208731362 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0b11d8aa09e87223cb0bd3305cc57b47010bb0a2 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d205ff40a817da56ffd9d619d8c020934c2e97bbc16f7b834c3befd004b633cc +size 208731362 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_65_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_65_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a3cb78ef2bd3b4e1c73822a9ac0baaab62ed5599 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_65_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a85f559cfbb1c2f5cbfa4b094f0803ea293ddeba6c88f3bf94d2002a7b632b0d +size 208732130 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_65_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_65_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3faf74635449a832e055bf83a9ba54318389b9ac --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_65_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:899389a9731e45d47ae4331e234da1a24285777fb402b35677a8e5c9164922aa +size 208732130 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8750b5f8f4dc0c2e8058b7bf74e4d0dc0e401d3c --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f13bb748a5d2d8d1918631e6f5b9ed680208c87a6bc6d734253a8196222c371 +size 208731298 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f2b4308f1f2cae44ff1f7adf2115ea988fa4c222 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:28b354e358b22c188e49f35d4e1ca885549159b2f2eb241a1090af48279846fd +size 208731298 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_66_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_66_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fcc9b7b67daf1f257524adc1f7e4bca92ef1c443 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_66_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c81bfda07aa7ce79b41f60fe50ec12d4bed75e9952bca2512526ae7fe6c16465 +size 208732066 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_66_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_66_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ddccb495f7a0f6c1b25e6270d8edacaea08c9e39 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_66_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:55667f92ac193303edea48a13c9f9cc04338a8d7c052aff6c79e55a041cee079 +size 208732066 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ca64b43696a5f715cc996903168d2627c946e3cd --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af466e512421936ddf4d77f79455c35fae4d390cdc9f19ff4d547b31d1cc99c1 +size 208731362 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f7607b4ce4db294103ccba116aa9ff5431be04de --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c21cb25322e43f8b45d20a1f8ca18d309ecfd8e156ee418ee2347862348f5b55 +size 208731362 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_67_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_67_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0eb81b2bfd9994c30c837f0aec6ede3f73298f12 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_67_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8116d09507e5a251973a5c6a8f36fcf64ed4b4613ce01bbefcdf8a1806b97eb4 +size 208732130 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_67_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_67_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..680aa2967ec1679560947a8b3f432f391a1b1415 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_67_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ebe15204c48f95573d5e9ecfb730e88a8b7d91997204fa039511f8ca798ae1a7 +size 208732130 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..03c4481d6314d08b15f55bf632a38673f403fe19 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf06edc054a37c98d089dca762c5fb6705d5282dcda50ebd324303162d89c61e +size 208731490 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7fcf7f979fac0d24347673344b0b50415cefc76b --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd13105c08fabc95a0f815e9c34379e45987f7eb56da388bcf4508fb99e75d34 +size 208731490 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_68_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_68_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7f5c5181a89c7be0bf2031d7963e593daeec7280 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_68_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c5817d458257318b67b7771ff9a99b36f52dbcaa5b7d8d7f8f463d4f992977a7 +size 208732258 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_68_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_68_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..53b50c27e3b78561d81e3c8e8dae1bb16cfcde39 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_68_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db2d8178201670c55bb5b350786a763355ede0cc848eff87a2a307ba7ba06523 +size 208732258 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..08a5f56b5d8965852ba886a883de602a882f91f9 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:896f3c480de257e7267b34fd965aa2508ab24d9fbe505aeaa2cb7a368695b4ff +size 208731426 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3a6b842597a90aaef9d216df4e052f412e590397 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8203e3925b02f67acdb012916f4dd1b50cb0e232cc500e6d236c06cd114ea63e +size 208731426 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_69_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_69_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..978c98339792b8a762da8141d92ca99c456e17db --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_69_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:28e1932f7ab58e0db6b62a68ae47ea63aed9a6d8a8a7663c1d4549b021285c46 +size 208732194 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_69_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_69_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8cbc695d003ef632828aa65dfc28f8522a0f1afa --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_69_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:85fdeeadebedaf2dc72350395ad0f6c09f41ccab041da767a7151494bac6ee1d +size 208732194 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..76c3df60180b89b36644fdf7d66193a759e3083b --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6335c9604d29d29bae3f9fe619d6d601811a6c63a8ca9522b08b9d0b625c07ec +size 208731351 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9bc3e967d0951453a0afaf8b68147d4044a85160 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:494ead74b40c20ed8b029486d8b5775501b69778af9c53cd47fb9d3303b0f0d6 +size 208731351 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_6_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_6_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d60fafc9703eaf9c24152533e45c008c6672ddd4 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_6_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:94d02f808f407c3ca97874f2cd2315c9edbc23c055564bf5bbfe9b5572632b55 +size 208732119 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_6_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_6_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e3ec61781aa8207865e49b46f9728c84bd36d279 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_6_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d7536aed46bc7e7f0fcca8f82e762f7a6952d7e307b6f7ead043d6d1388c6ea +size 208732119 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c8befe53c73e9925d9d7e8753b549bf488bdc6fe --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6765265a2d07ce34771e6dc3087cc927bf28d37ab728fa7f55f0f1c3ba40419 +size 208731362 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..da2737c93386d7c16b4a71278b5689451fda632a --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b994110678fac4607c275d8a2e1e458098ad418235fd3944bc717e0ec5720c8 +size 208731362 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_70_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_70_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..21c10315067332e94f3d87da73409978dc08d4bb --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_70_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:792eade0d23de7464a7d31899fdcecf5d3d392be0d93f87733663c951791ecfc +size 208732130 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_70_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_70_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f73a110e2dfe4d912a811b408d3fd304c8259e57 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_70_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e205df76e2b8fcd5bcd3cf6843a752e223624806133bfe1ed63ed6f8d18ea3d +size 208732130 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0ed3b8ea72a74ba0eb5771f0f274138ec86dcb64 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d5e56f641bb0d7e5bab01186f1071e9ff3cb68ffc4951dceb51760d4ec80c713 +size 208731490 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5ce9867a087e884791a6bec3fc7dd7f20edb7714 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:677c54add811110029204c3553884a7388796a6a880b3be9b93f96f52753a97b +size 208731490 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_71_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_71_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e4d3f4a5662253fb2bb5bd91236b3fe41f388c7e --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_71_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac8e6ac06c7e813e7edb9e6b2e23c7fb7c2ed905212a8a5a7aecf2c0e1d346a7 +size 208732258 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_71_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_71_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c7ad399c1bfa499a933109cecd318797c08425cc --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_71_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90506e0cabaea93babac03cc165763fb2d091ee6e370fd4dea738cdf4a4ef65f +size 208732258 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..398c82b6943c5f8131555f450b2c2a457dff8386 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bee16f26bf57d0472667061c89f0eb7e5b698d63debce4b549c64c93d6a0f125 +size 208731426 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f5644954d0f4ac81738488aa24532fa215c838e9 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51e7336f4276028fdcede730058c369409e531c310ad9699385239ef409ca47a +size 208731426 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_72_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_72_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3eb2b5edd403748e2808857f2d0e794865246b02 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_72_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d7d22690ba59a8ed499659a438110ec194d276266a8521f1784ad13c7e501edd +size 208732194 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_72_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_72_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c3eb80fe568dbde5ed0d093c3a3cda4adbf7569f --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_72_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af351d7a359d22c127b8a1df463cce3b2df0b81b016e43bf0e19a615d482ac90 +size 208732194 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..00172a79abd68028fd09c3acd4558321a713e8e3 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9caa22dc5c29d8cd6d7ea30ab9d1ef7853e29d58d43555787a64dda548d44089 +size 208731362 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2afe1d6e3753b478281b778528b2f4d319f0e36d --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a4d5560566176c1e000568445a5fb807e9b3124d3dbac06a3f31859f1337fa3 +size 208731362 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_73_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_73_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a77fe60e272238de1c6d1f85e1c415d23ac553df --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_73_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:72b3fb808e2388bd7a8920160ac53d5c02e7c96cd9b8b6574e578d20bbe7127f +size 208732130 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_73_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_73_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0373409931c40a1170c6b6695aef08764c8e4f13 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_73_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4efea999fa492276f967c0749f1055e853d29f8f73a4a8f73688af8c9a934e27 +size 208732130 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1f60d5cb20aee1046b846d296df42165a34b8d1d --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1701cf2fa8d68175f38b8480aa85363b69d8f97da55ae3af9269a5d9ea3a32b1 +size 208731362 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..997077c1b93ab4e9c0c74153654faf4290ae99cd --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:141c07fed4909bda1115092df6e39513ca4eadfb903c8591d4f8a3a04322c2ad +size 208731362 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_74_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_74_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fc1a1f95ec52f967e42be60947a2603354333ada --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_74_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b3a3a7d1c7f32a038cabf9430b532c179f30ff7c4b6c56e74bb5f766e5c72741 +size 208732130 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_74_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_74_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fb93e8184204c7e9d8699575b16632841ebc69c6 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_74_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:15ce02326e8582b8e5922ca308c189f7b81cf7f845491c446b734c5c706c8b43 +size 208732130 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..464546d0896d921aeaeb8fe2602c8144f4dfd24a --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5642f6039fe8a4819287fe7d5067e97be4e14a87541cf2fb9d7110cfdaefbdf2 +size 208731362 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9947a02e348f664b6779f22f1ab95aae88cc17c3 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08390f8e294bf9711533de2f3ccd6043210b4a7c0e5594ae8107d9377634ebcc +size 208731362 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_75_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_75_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fec04085b1fa5677e700bbddfc611e244b2c8041 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_75_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ecfea1768a84cbd557d718dc1ffbd7d5798311b45c4c3aadb7c6d43c503b00a2 +size 208732194 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_75_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_75_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..076a26b68bad95de01121f2593dd9fbed15b47c3 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_75_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f5d7472cadd69a09c00befdb5983d9312ec36e963f4d95c93bc2c4414e1f1ac +size 208732194 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ce1be042c0b8d3d05348a1e12615bd666e6c9c22 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4161d3026fd4ae2cba922c4577f74f887c7b3b085fb9fedef146994878ddf7d5 +size 208731490 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dc5f8511bc9cc7f79f17a4abbd314af35139f54a --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c2eac2a318f03c0a91fd1301a5aa186d229da237087764826b08b2eaa66b99f +size 208731490 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_76_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_76_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4d7e2386ccb11ee346609e812ff4e9b123fbb426 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_76_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d69f8390dcc8d6ff8f511200a6d08f507a0d943a21fd96b25e088e33c1b481af +size 208732194 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_76_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_76_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..57d9635001a74b1d48cc11e86a2543e958d02763 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_76_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:94142d1db199879c8522be6a2058d8040fe0409ce702317b816483899ac77434 +size 208732194 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f09f766d590038188234d92ad1596cbaf642cfbb --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e61c4cc4e4dcd3b82afdf4684c1468156f2e7a85fdf0ab84c0a99a3a6778fd72 +size 208731362 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8bfead08eca96e81beaf6c6abed330623aa31dce --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d2d6bc4d5ccc4280d9ae52b96a4a4f1f134ae753703878c27d66179fc9bb5d5 +size 208731362 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_77_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_77_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9b0207d11289ef93688a64f31f128dedad01389b --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_77_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cef8d167bf6d52447043c19fdd4520cd5c863191b32b83aca06ae0be11a8f9be +size 208732066 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_77_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_77_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a1bbb1ffeeb1a7a762db11ebdd56aa2cd3f5c95e --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_77_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:470ed32c18cf04c6e157b1a200df802a904d489021d7a62c16aa46b72c0316f8 +size 208732066 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..231255c4220b436e2b3adf29c85e079283998293 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e1a43031ef6d2071769809b1f8b2aeef9476af4e106193cb11b65af7b2814fc +size 208731298 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1ef00650f5e4322fb57940a54f9353ffbbd6f95c --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e8a0b5eb5d51bbc5d002bdd7e0a95b588e5ccdd6d3e994d7dd9ce0fef928dff +size 208731298 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_78_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_78_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f5a4eef41ac22320a072861b0fe874170ada36dd --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_78_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:36c13d169852f8fea39a24cc55698ecca9c1d22d004754ba7d07913e97924126 +size 208732066 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_78_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_78_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7162b06863525f70d339b67ca3906221202c033c --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_78_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e0561dcb00b55b35a32738ded3a5d80e64e0e269cb1532e7480eef28eb28c2b +size 208732066 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5dfd026abac81edb0b6ffedff26608768d201287 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b4b5569c67805f503619bfac333ce8a9c0d4aa1b35604336e2db817da14d908 +size 208731362 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1b8dd9f631a4796ee9f8d7990140869d38d0376b --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f2184fabedf8d83f5f5ca67a59e3dd4fc0f7d6776268cf70e2bacec7fe4fb972 +size 208731362 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_79_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_79_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..267bb524fb1c8c767be70e2f10c517e889414695 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_79_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:435de5505c21995b4ddf7bd3b004e6c5af117a4ed6353ff2472c9e70ca4a6380 +size 208732130 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_79_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_79_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..da19b614e1d19bed868ad37de0b13182c1fc288a --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_79_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5712fce6a57412ed15e948e88d2dc8be78b08d080e763a97039dd616e309e765 +size 208732130 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f1877df1bb3f48aa5281b4f49842b5c470f95c9a --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a4db643a42101c1e175e7b679168dbe45d0d5f07ccc5e2c521cd2ac0647829c7 +size 208731351 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..91612ab027e6a6359b0f29a2b4e0724ce4303066 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:83d1671031d3ff50f825dc65988bb4e225964598cb2eac1387da1d13f801a64e +size 208731351 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_7_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_7_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b15aa9d31c71eeacd143311c3122dd698405438f --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_7_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e8c32d5cb2407716d157d94f2e054905aa3ba342ade4c80c2f59a15414a15d3 +size 208732119 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_7_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_7_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..988ca8b038ca5235168459b97d0d3b09a3d7d02d --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_7_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f1207cad63055145ada4f80bb65fd9f19b9f0eb4264934cca59de750d8f2874e +size 208732119 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6cf76228bd5e2a06ec797bd6aa9592f3c91a06a6 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7cedcac3f5981e01cb01a81fc9d7b37e696c9c9612b1dd97e46d84fce2520c18 +size 208731490 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..739f6af70bf30e306d7c04f22b03667a30bca79c --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4af5547070ad014648322eb752cc839525f288f34ebe1a044dcadf15e5a88196 +size 208731490 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_80_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_80_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8e9d6bcffaedd99f237e79620530db13f4ad41bc --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_80_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eef5ec2951c123dffcbcf2989ebdffffa6b7c6cea8f8f434cdd72497abbefb4e +size 208732258 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_80_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_80_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9d2c787f11051b5d940f17bfa3eadc386b05e36b --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_80_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:079cd9c55ec6add17c68199cda61bc31ca4d12b8c2eba0e323b2643e44866c88 +size 208732258 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f7ced2b22cdccb21b99085ceae8cf6a4a3a39cdf --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90de2a3cfd0857e99dc93611374fda3aad84d207ecde94971b08541b5b8add3f +size 208731362 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4126a1cedbb35a26a0bc9ddda9e27810d14f1b22 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c5afd386deb39a3bbac3f3822d8e454dd541fa81b1de7759a5a2d935b0a77c6 +size 208731362 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_81_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_81_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..745b39a4ec2514b09909fcc42ccaec7344150a0a --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_81_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97bab0829a94dfd14dbea86542af559003f54bf8c04c38f28e9c161319f847fb +size 208732194 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_81_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_81_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..20ed2480e5121d393568f79928beb49aac8df8fe --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_81_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b300e3e97c1e0cd945b9eb1e7a5d7fc28320ea5578eebb487563884d95032b1f +size 208732194 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..258fb5a0576e001af01b40bc0d61c94760d2a1c2 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fef9a7a3852c0b92bf1ceec88743266b78ad3963e7e93fd720658584f5960dfd +size 208731490 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e6f115c2e67bfef96990d8a933393c121e23adc4 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b805b79740e5e233265201c96e777d254f98f4c698d1e6159384d98ec07afaac +size 208731490 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_82_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_82_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e0c34126619e963e9508ef9c96b16029e5eef2dd --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_82_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b4143163090d0f7740e76fec46fa72b6cbaeeeeeabc5230c8bf0d135401632a2 +size 208732194 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_82_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_82_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b051b7b31fe49aa5ac641884b82ee124046f6180 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_82_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:67ed4e568e49fcada6c2e02050ac52557bf63c58c61c81533b056f431099d1c3 +size 208732194 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..673423c9120e74f10167ee76fe9c08a801bb12c7 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f63561861437b924c811bf32ea0f1a1ebeadcaa6526e0793a34280de0fd68424 +size 208731490 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..06928ec7ebab86ccb4bc73d9b2944942274b1cfa --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b62ae02da9160a6d8b2c0cf3b14d02ba57bc896b5f5eacaef526a76b43076594 +size 208731490 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_83_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_83_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ce314ca21ae4d035c04369d5e54b480c8b3db8ab --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_83_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7960b36ae66d7943718b6d96deb8db4f359db73f43c3e1230480c989e073f0e5 +size 208732258 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_83_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_83_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..710916659c6a93e17ae17a33d667ba9c1c0e22db --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_83_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:50086c045e62a79e1957b64d83801eb56b0f574bf04690a4541c64d9f5dc1889 +size 208732258 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fc4af0e087fbf8ae5c091b6b5ab75d3338261f16 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f4b1a7262fb1492eaa30c94ad1de58e2b5c59fbeb4bbcae7013c88c55d41ec0 +size 208731362 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4a17c5154ca9690487cd3537355f6f420983169d --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:24134a1d2fc87f7441570ff3c8f7137a169914d62cb4f950c9c0c4949106e935 +size 208731362 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_84_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_84_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b3b97972b85106631b69a9e90b6865d26e0e0c66 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_84_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1dbe680775a1ff5b0b3e46ae6823a5e7684072398b9d6860658e50a4bc4f824a +size 208732130 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_84_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_84_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..16f9beee256e4a173e7b9918af34a743433609b4 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_84_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d0acd1c5d14f826945c3c099c75f4766c4257b972fbf5f0bb1f592484ae0ddd6 +size 208732130 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..27cd3a965bec24b28bf690db33f8398ad7aa5828 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a69dc94eae2b862d2ce6ec719db5fbbc780f01562718f4f0467149a2745c624 +size 208731362 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3be0f09f2f47baec1f88ca66fad44765f5067aba --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e8c259e40f651e4740413c196127886b44d191c683ba6e8b96fb330fdc0f848 +size 208731362 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_85_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_85_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..435dab45071ebb9d056dcd4c39557e7a8c918a4d --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_85_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b312d990ea2df6429e4c032da8238680d72034d58de65977c774973f2ca5dec +size 208732130 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_85_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_85_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f1a8e6034e6673c3d35a9316fa604f03fa83db96 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_85_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9f648edc962097089e128d6c9fcf4f023652e0ec1b0d1fe637986578c852ad0 +size 208732130 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..93d6f217e21c1f9c944fe36900ac7dd3fad3acc9 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d807bdf65eb6da63448b3e7945411243fe3cca86fb168485fe10ef803eabfe8d +size 208731362 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f6ada89feca73d13630f0fd9264da7d5bc3a1635 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8de52d32c382a470170bae99620890a363ff2df78923ffa0623a60a06527f1cb +size 208731362 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_86_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_86_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6bd0853a75b5770c567efd54e621c6ab176bb288 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_86_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:43eb9bbb9a2b636a1104148887c0eed1217a8e2f83f6fd0d35d9d7906337d0ec +size 208732130 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_86_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_86_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6b864f244730691be6ab6f1fc3ee8b6525508d4c --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_86_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1bdc42521d4c9a7057347c8d1a56c0e427fd693d74a689827d88035845bfc83e +size 208732130 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a4d3f39e77be66ef8ec506b359544200c9426ef8 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5bc18572c2cdbe417fdd8c531bd7505fdfedaa35a01306692609a04822e7d962 +size 208731426 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c9aa25a61d0cf1b5459862c193da85e3c8b45fb7 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3604f194a04223cad0f0a7b43e27b9232274c92ca1eb9887fb87491a1e84ecc3 +size 208731426 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_87_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_87_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..de7bdd76a45687c4f371ea436585de89f34f6f06 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_87_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e25ab5b5a7cf470fef1db70800da3f10e7a881ae730e003b38b66819b354f650 +size 208732258 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_87_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_87_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c781c698f476a49630f22f0c72faa961cb987631 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_87_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f27e58c6a57de353a802822a1c6aecbd28ea62bcdb90d8ef8ea1bbf280ef5c65 +size 208732258 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..aa115076b49359e2ac3e4b5881dbfbec1d1baba6 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:323511c01e7663751f35d1ac9e852ff839a2a14539317595501937f23b10d027 +size 208731490 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7f5f5c7cc72a45ab8c59737e9e28f575eb7091d6 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e3fb5f40f5009252dfb364f7fcb46c29c5caa0c70d21d15fc9fdf03dc696278 +size 208731490 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_88_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_88_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..20d4ecf5e4b753d45eeca2a36ced5657093cd162 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_88_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1eb7178837e93202dd37a157156d1847b0e423c57d0d65557e0263f00fb5f7e4 +size 208732194 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_88_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_88_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3a85b4f6c1cb14483d3cf823c33254f8f5f50406 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_88_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0529cdd406339e88d5073065c1b7fd6639900fad174d2f1ae905cf460b65d666 +size 208732194 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f6e7a606280313c7833be1452afd0df73590f115 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c3f9c3658d72ce9d75052660392ee89d0e7aadc6cf71af450ca064e598bd6aa +size 208731362 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d8188d3d58f60a405a0f8d99f989d41b523edd63 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a34852700dbe8f41e45ad663d504b4bfbdeee767be71116dcd9fc80f9a27f89f +size 208731362 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_89_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_89_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..237bb987f72ee928f7a891835e62e31884b2c6d4 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_89_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5019eb3237187ac7cfca5296aa74afc43480f7bdb061129f0f8bddc2aebf5ae4 +size 208732066 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_89_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_89_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..90b41644a59048ae388bcacb95f1b9a5af187006 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_89_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:818669a1ab9051689e29fb98e10f08018132f2cdc30e166f39896f2513d35951 +size 208732066 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fcd42746dff15ab311bbbad1ea5131683e95df1a --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3423f55bc398af559a0954b1c9daf38833823e03072b642d23ff553079ea8ce3 +size 208731479 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..50a990aa07097ecf971fbae6b089142adc7239ee --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cdb97a6282ee29f363a2a55005a2dd83ce54197f8766718e721b1624977c7aa3 +size 208731479 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_8_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_8_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..89734d9ff43ae764c027cdf2658dec2a4a064a46 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_8_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a423030e7d473364698c8503073a7c214c8dc431bc90d74b41af46b7e15c409 +size 208732247 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_8_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_8_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0cad0b02d04926a9c18254dc9d79c8bf155553f6 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_8_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca24443bb57219b692472c96bbb8ba773f3bc3e39793434a1615e1aa53b61696 +size 208732247 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5fd0bb99686d60b076ce105e93a868b46e6294bb --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed314a021ddf8435fb69c3b809f9d3793004fa99bac1c37c0b1c20a2ac59f27c +size 208731298 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7fe66a4183476d58f422de6ac3a81f26b2e2a5bb --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:72c83cf14f085d90b20211d4b9a0a20463418697a9abc7f21ea2decf1c720289 +size 208731298 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_90_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_90_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a99f72fb21d3f3ee39d7d696a851ca2a9fb5a76f --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_90_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ad5e2b9ad4f503e9741f55143c915853e58a1b95473cbe9f57404385403e401 +size 208732066 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_90_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_90_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d45f9b47f4c25d8d2f5a5b8a8216c3f032452ff5 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_90_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:176921f865ac5c92a0cc40a831177cab6d0a6b59a2aa03200f75a26da60f94f8 +size 208732066 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..66933fe3a46938a878a0a381e1e8c8e6fa4121c7 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:07ebd533b08a19d701ff5f42030747455712f19c6c0615c5c4bf14d55e7be6ef +size 208731426 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4d4bed43cd30e9cff95a821806f64d99bbcbb17e --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5374cf993766a08cfdec9c8a746f16f750077006cd7d69365c6f9c6970941393 +size 208731426 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_91_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_91_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..573f7bac8f80dbad6a73fd003a5a3849f9fb1aca --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_91_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:349c482587f4d19822627dcfdf2ee71df7454d16be0d22798ee01bd7edbf941a +size 208732258 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_91_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_91_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a940e7eebe41977466dddb123afa9274ff0b1d97 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_91_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a0b6ff6c5a4a850d24ecbe3b6223e44e1734056d865ba0b500ddd0104055bda +size 208732258 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..09595525ad7e28d799bf778ae255c3d3e88c4f24 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e5bdb964fe8a5e8565892f7edfa4cb29cb19dfedb5f4a27bb9a09a49933dd18 +size 208731490 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..31b6b639a0023fe1d156d8fc58a0179e5297f670 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cac0d3c05811fb0aed60fc7c32db8521c690fef90192d1ed795cca16665373bc +size 208731490 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_92_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_92_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f50276dbb9f13683668e81fcc538d6b175969b27 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_92_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92f29caa2356a3432f2921ea08d36685763b6201ab50549b44a20997b8492007 +size 208732194 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_92_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_92_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d065692d1d9eb76e9bb8e86bafd80fb26a039dfa --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_92_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa5e265fffb688f0f9b7495236fa9cb21a72d6edf71090b65d1192ba95161016 +size 208732194 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5b267aecf2ae052ba24950f04c95843202c78138 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d562ae60288843d7c46c3616c3a5f6d55f178aaff1eb092a49d5d31b5311dc9 +size 208731362 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..13a462414abbcf9ffa0448261f6c61f0e9fa05c8 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:33de12673143fbc1ffd36b8ea4585b9db5faedc6b93528d837cd1cf0043eff37 +size 208731362 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_93_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_93_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d22e97954b805b9af3100e056cafa442d29e87a3 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_93_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:088867571a4cf939f16db8fe88e0f88ee9165f61ebb2be2af319869aa81a8cb5 +size 208732130 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_93_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_93_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..acfb8f01b76a682175e58ecbb5e3b7b4b9bea1b4 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_93_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8cf72ddba7815eebb7210b53ac15f80f23036dfbd575ec8f6025856ca586a435 +size 208732130 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..510b8928a1dc676e2e64db7b0c516c8bd0770654 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f0566d634dc848bf130a7481d80f5c229e2e2577239aaf43bb2b92b36e378e9 +size 208731490 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2dc3d4ab62ebd9ac7063d35155fcbea94937e89c --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:28f06698c61cf7b22948481a64ef8f50f8287aa16f486485fc0158170e7ec421 +size 208731490 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_94_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_94_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..165921e76e0833a9c357d0617ea27ba78139a5dc --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_94_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:659cbc4b7c2f23f2ccf2074146a26429728e78a06015bf992b2d382f3554ae03 +size 208732258 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_94_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_94_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8005a27b1c8b0db8572ed45890a1b4c385608def --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_94_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:686faea9339b22156e59981677d204658a44cc7876600582ae1f6c76ac8a79b5 +size 208732258 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e87fb44ac38ec4f7e570c9174039693258c11006 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:98e3cd1e511972cb7a3cebd187e49cadfeab301882c7a8aff9a8d816397f4cac +size 208731490 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8a52036b8752abc2d7e283def723dbd3c1e9deaf --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad4d1815277b7b2d537bc1c915b8abc3e443b638bad718cfd1a1f394d11c0444 +size 208731490 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_95_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_95_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2df7b6601a4b70dbf2d40a7be2d7dbc26289b20f --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_95_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f222ec8eb8d2f728ca3b379f57cbd68ed17f3116137cee849344b57df5afd30 +size 208732258 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_95_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_95_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c9fcc22d842077eb2514b02e5e4297f94bc14008 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_95_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:45e1e800532622fffb426a3f012170e92b3bdadc6fd58ae595c88532be52f585 +size 208732258 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..430d262a3db58e98e9dcac502c5907953e46e62a --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4dce7f2e33270ceb8c0a419fa8eebe8dccc3876f71a0709bc1fb2992e686093a +size 208731362 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ad992859ad04ceba7895708f38b745fbe4ca57ef --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a5a9ac155ad322bcc2dc5f50d1cf5de9443e683de3609935129e9b3689e6ad6 +size 208731362 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_96_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_96_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..060f6a8435dbd05eaab15ae8ec7edd22537de347 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_96_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:16f92683c25b2c002550a2356cc7bfbdad60669ce3e5e27904431cb309987d83 +size 208732130 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_96_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_96_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9b9863b6893b82db0f432b8184c81e712cccf4de --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_96_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc0231c496e57bf193517a9a6418e026863ddf7f1bed2b24457cec14b022f5f2 +size 208732130 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7cb0113bc3a5a219d62a8cf4a73e631cd1caef72 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ecd4f2251783aa609213c980e10bda1cc90d9266a754d25e31b1b3d62e1949e +size 208731298 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5204e09dbd013b6330344f9ff4d35feb91cde03a --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8258520af15d7b7ec3b7285e78ed9aea3658afcc9838d1054f23295b276e5b6e +size 208731298 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_97_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_97_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b33aeb92214c8c2f5ec94fbb740958884285bd1f --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_97_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d0aed6079017ef646191384c21f1e8e11bd95b615f8e2cbf94c6a57ea5b2e3f +size 208732130 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_97_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_97_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fb31229fd3617398f63ef76299e042926fe72b3b --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_97_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a4389f0e86f2efcd403e9ffd844947aaf775dd22a0141b6812614b8a5f31b06 +size 208732130 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5e805a74b84b5d8c0fc6fc914ecaec237f053b93 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f8416e6cac7c185530c9cd11a8989f0582958cb1f745cc5ef72385a5a988c0b4 +size 208731426 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d578657c0539ca48dde96057bb76f7c9cdc2ff46 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f4654f96bbc2332898ac62eb43e907bae494421a884a565576d95b3a40e2ce6 +size 208731426 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_98_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_98_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b9a44cf01d1233d22a8993ccc25e8e4aeaa86622 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_98_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aea78ab0281f27635d909773ef1abfb67e7baa074c4966d0f5dcc481a2b625cd +size 208732194 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_98_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_98_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..67f1bde827c602efbf7db8a9d58196c280a9765f --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_98_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ff0261c5b2d9a388e4e15ff6f31f7028e9c072fa11a1a8a25355dbcebc47c6a +size 208732194 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..14d4471eeff7f926b57a01e0d5151f048fb81df7 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4dfc0103855e0b22a5fffdc545253a550fc930d0f404928fe4e7456416dfa0d0 +size 208731362 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..933addb8ec6f351188e49c0c6e8b0d2992f172ee --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:073ad2f5c84c7081a932bad5de8e6e43176555f58a3b9ce6314fdeccde52f09f +size 208731362 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_99_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_99_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7f172164a7a11cc47ff31a97366000d935927f68 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_99_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aaac807a4301d54f51c13b8927d8a587e7c2ed1db51a2f07939197caae633f97 +size 208732130 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_99_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_99_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..538ccbad7c87818021857e29764645155036d2e6 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_99_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7001bbe34b205a594fa899364a2661e924424d22068afe0bd4a07f7eb1f92a9d +size 208732130 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cda481ae395dcf02cd0c91d024cf754b66343f78 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab56013ed06f965810167c4e85d8b32a734859735b64543033e02a8783c88584 +size 208731351 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f8dd691f9097fc3af9afa930130a42a9567148a8 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a0e0b016ee7d0f18cdae52f568bbcd89f13cde763dde7f5cebb65e6028b9430 +size 208731351 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_9_mp_rank_02_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_9_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ca2101b89b24ff714733466c802b851a5bc6e8c1 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_9_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b2f8e21d64fc6297b2850ce24835cf387db71304df7d1c1fb25cb7fc86bd053b +size 208732119 diff --git a/8b7178b35b/global_step84877/bf16_zero_pp_rank_9_mp_rank_03_optim_states.pt b/8b7178b35b/global_step84877/bf16_zero_pp_rank_9_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0423dd7dc8232d39a8ce03ac33237e5a9361b344 --- /dev/null +++ b/8b7178b35b/global_step84877/bf16_zero_pp_rank_9_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:419f0e62d6101da91af15b905af213fe5fa71be339579ad2203f907da051f67d +size 208732119 diff --git a/8b7178b35b/global_step84877/layer_01-model_00-model_states.pt b/8b7178b35b/global_step84877/layer_01-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..706dae79e8653eecba7dd8cdf2d832ec99817644 --- /dev/null +++ b/8b7178b35b/global_step84877/layer_01-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:44da557fafc8b87ae8951b1d5545e18833d9583499e8f2e58b06298bbcf18cf4 +size 223347971 diff --git a/8b7178b35b/global_step84877/layer_01-model_01-model_states.pt b/8b7178b35b/global_step84877/layer_01-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6f4ed7eca3fefc780357a85d0dc864bb04f43b72 --- /dev/null +++ b/8b7178b35b/global_step84877/layer_01-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4ba5172c78b1d5d05c865b91df4a43e2b949678c55690a6fd3d322c43a0237a +size 223347971 diff --git a/8b7178b35b/global_step84877/layer_03-model_00-model_states.pt b/8b7178b35b/global_step84877/layer_03-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b08c0d617d53e66103a9c1b5e2755743a1e1983e --- /dev/null +++ b/8b7178b35b/global_step84877/layer_03-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c48a38188bad96017faa90c5db4c26afc5ed62992a71d5c5461388686c692540 +size 201408771 diff --git a/8b7178b35b/global_step84877/layer_03-model_01-model_states.pt b/8b7178b35b/global_step84877/layer_03-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..471018d7c9344924683e20b1d8cb89953f6adc2b --- /dev/null +++ b/8b7178b35b/global_step84877/layer_03-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ef728312f270bba1c0ffb30d233ba8b35d75b5c9038340a0e997fddfac18078 +size 201408771 diff --git a/8b7178b35b/global_step84877/layer_04-model_00-model_states.pt b/8b7178b35b/global_step84877/layer_04-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..29981217c131581202ee38ce8c1bf5ddb9c84da4 --- /dev/null +++ b/8b7178b35b/global_step84877/layer_04-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b347b55468ee9d7eea077fa536da2c28c4ad2ea7934d18c17a099565063bd69 +size 201408771 diff --git a/8b7178b35b/global_step84877/layer_04-model_01-model_states.pt b/8b7178b35b/global_step84877/layer_04-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d4a4a6d17ba5938edc139f2e2c186ff87c199c9c --- /dev/null +++ b/8b7178b35b/global_step84877/layer_04-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:757ac1ee9201cbe9ef9da2438465e1d356c6a1ba81d2bb2862fd5f562b7eb71a +size 201408771 diff --git a/8b7178b35b/global_step84877/layer_05-model_00-model_states.pt b/8b7178b35b/global_step84877/layer_05-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0e4c15cd24aa0bb4016eda292a4e92428fdf187d --- /dev/null +++ b/8b7178b35b/global_step84877/layer_05-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1794a26d1fd546f044ffd81e3c6920a3272f3b1b9727bdbb520d8b49a76bda4e +size 201408771 diff --git a/8b7178b35b/global_step84877/layer_05-model_01-model_states.pt b/8b7178b35b/global_step84877/layer_05-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8b8580230ea3dca339ddb43ccbb2571d58929615 --- /dev/null +++ b/8b7178b35b/global_step84877/layer_05-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:37ceada786a6e0872ed6ef2e7077de4ddcb5f733a252c26f84872c42bc0340a6 +size 201408771 diff --git a/8b7178b35b/global_step84877/layer_06-model_00-model_states.pt b/8b7178b35b/global_step84877/layer_06-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f3724e07aa15446dff6db0444c2e9696a3cb3c21 --- /dev/null +++ b/8b7178b35b/global_step84877/layer_06-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4981d2630f03b9062e26612d4e314b05579c4a57addfb5a74faaa8af217245d9 +size 201408771 diff --git a/8b7178b35b/global_step84877/layer_06-model_01-model_states.pt b/8b7178b35b/global_step84877/layer_06-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..119f95dca19983937c22892065612e2a2586529d --- /dev/null +++ b/8b7178b35b/global_step84877/layer_06-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c5df5350c9e1bf8b87edee5a1d96210e5deebd1cb740d70adce664a5d697973f +size 201408771 diff --git a/8b7178b35b/global_step84877/layer_07-model_00-model_states.pt b/8b7178b35b/global_step84877/layer_07-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..533b967b5691a873451967810180020b574e90d1 --- /dev/null +++ b/8b7178b35b/global_step84877/layer_07-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:19e437c7198db8709bcd49cb57d491328b20138e520cbaddf858957b85ea09fb +size 201408771 diff --git a/8b7178b35b/global_step84877/layer_07-model_01-model_states.pt b/8b7178b35b/global_step84877/layer_07-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8caa27edd1d2e3dd853e6a8bf3692f318e009fd8 --- /dev/null +++ b/8b7178b35b/global_step84877/layer_07-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bbfbb3318ad6eaf9ed5fa9b637647a96fde1f1424e1c60d0942955bc94ae8628 +size 201408771 diff --git a/8b7178b35b/global_step84877/layer_08-model_00-model_states.pt b/8b7178b35b/global_step84877/layer_08-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..df2161c64466e3fce31a144a1944a1a3642e9efc --- /dev/null +++ b/8b7178b35b/global_step84877/layer_08-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:844bd4ef2dd5e70df23af804d10dd7798bbe5276d4ea49c53420dce4d3017cb7 +size 201408771 diff --git a/8b7178b35b/global_step84877/layer_08-model_01-model_states.pt b/8b7178b35b/global_step84877/layer_08-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a1c0e325921fb920ca64d8c7ea8d9300fdcad60c --- /dev/null +++ b/8b7178b35b/global_step84877/layer_08-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d24eca8855cb50736d390fb8b193a3ac8e75241bbe5a3ab322b969ce98f070d +size 201408771 diff --git a/8b7178b35b/global_step84877/layer_09-model_00-model_states.pt b/8b7178b35b/global_step84877/layer_09-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..01c6058a5bbe775105c1d78f20186b0fe8a6fd74 --- /dev/null +++ b/8b7178b35b/global_step84877/layer_09-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5eaa301887b3fbcb35b44a61636c460d90e3013c2d799afa26e5d2c2c3601bb3 +size 201408771 diff --git a/8b7178b35b/global_step84877/layer_09-model_01-model_states.pt b/8b7178b35b/global_step84877/layer_09-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8e3a2f4772cd00c29342d56a338bdd1d53afe98b --- /dev/null +++ b/8b7178b35b/global_step84877/layer_09-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c2ca182295dfa645adabc56bb65f60cbb6e4ccb18c9d35312ee0f7619f1e01c9 +size 201408771 diff --git a/8b7178b35b/global_step84877/layer_10-model_00-model_states.pt b/8b7178b35b/global_step84877/layer_10-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0f74d011d2fe0848f306afc2859cb0736e26a13c --- /dev/null +++ b/8b7178b35b/global_step84877/layer_10-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c497fb2c0377084b1f36b26c07e8da9ead87b39bdfda74e6f53185c78cbeb23 +size 201408771 diff --git a/8b7178b35b/global_step84877/layer_10-model_01-model_states.pt b/8b7178b35b/global_step84877/layer_10-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8a1b8f9c4724551b2ddb1d5c2355dac20d2c962f --- /dev/null +++ b/8b7178b35b/global_step84877/layer_10-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c5bdd6a61d024863896eac9395ed24ba394f283ba716fca6e846b6485cca5f84 +size 201408771 diff --git a/8b7178b35b/global_step84877/layer_11-model_00-model_states.pt b/8b7178b35b/global_step84877/layer_11-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0741c5c7c9c537c91ab23f4c6838750e02a54320 --- /dev/null +++ b/8b7178b35b/global_step84877/layer_11-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:274b70c8f642bbea1225cbdfc28fdb982df905af91c348a7e968e26ccb145b77 +size 201408771 diff --git a/8b7178b35b/global_step84877/layer_11-model_01-model_states.pt b/8b7178b35b/global_step84877/layer_11-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9c11a5d76910678f1918061accc4de8c5b778161 --- /dev/null +++ b/8b7178b35b/global_step84877/layer_11-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6cf5829f4629d4c83559fe879ae995c9e6bed990ea98e56ed712a2a061598358 +size 201408771 diff --git a/8b7178b35b/global_step84877/layer_12-model_00-model_states.pt b/8b7178b35b/global_step84877/layer_12-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ba904a6bb06f3156d8b3879e3f66aa84d6582ae4 --- /dev/null +++ b/8b7178b35b/global_step84877/layer_12-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f0840713220df11b2dd042eb5b8592316b4b9ccfa830f473da5663c2270b907 +size 201408771 diff --git a/8b7178b35b/global_step84877/layer_12-model_01-model_states.pt b/8b7178b35b/global_step84877/layer_12-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..68299f37f46557202f9688c67800609014868a03 --- /dev/null +++ b/8b7178b35b/global_step84877/layer_12-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f257fd7b94702c4c3d8a069b4228e8a6cc06d08567a843f0e05db4769e3edf0 +size 201408771 diff --git a/8b7178b35b/global_step84877/layer_13-model_00-model_states.pt b/8b7178b35b/global_step84877/layer_13-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..561f62d0bffd190aab8f1195410b0546a50b59ba --- /dev/null +++ b/8b7178b35b/global_step84877/layer_13-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1bbf78b519ea80d3ca9205f88b61933c1c5a23339b449637a395654d84405f2a +size 201408771 diff --git a/8b7178b35b/global_step84877/layer_13-model_01-model_states.pt b/8b7178b35b/global_step84877/layer_13-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d9440572d4438eb62a8d6852579cefb0289b3d91 --- /dev/null +++ b/8b7178b35b/global_step84877/layer_13-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf4f94bb9e067ab92f57781d20343edf84af1ef9835dd03917471d62e75ca861 +size 201408771 diff --git a/8b7178b35b/global_step84877/layer_14-model_00-model_states.pt b/8b7178b35b/global_step84877/layer_14-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b89a518bbbb71b62aef3ed857732118944b57770 --- /dev/null +++ b/8b7178b35b/global_step84877/layer_14-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af274fd096726a56a78645b8560a90eaee15ec1704fc618726e22a1ca72e73dc +size 201408771 diff --git a/8b7178b35b/global_step84877/layer_14-model_01-model_states.pt b/8b7178b35b/global_step84877/layer_14-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3f1925fe333f2f949c9f1161cb38523cb6b3a06a --- /dev/null +++ b/8b7178b35b/global_step84877/layer_14-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b955ccb012aa08e9ddd5682a1ccb80641e4fc25558bce2e7492d5ed2081e5bb2 +size 201408771 diff --git a/8b7178b35b/global_step84877/layer_15-model_00-model_states.pt b/8b7178b35b/global_step84877/layer_15-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..644651d0e95054a04456747f60115c3441f452ea --- /dev/null +++ b/8b7178b35b/global_step84877/layer_15-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb219c071011c1393209963d113b0fee36f3d46e8a65af8e1b3eeee78d2195fe +size 201408771 diff --git a/8b7178b35b/global_step84877/layer_15-model_01-model_states.pt b/8b7178b35b/global_step84877/layer_15-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7db7fbeba2a763adde1c086e1bf9d708e9d59eca --- /dev/null +++ b/8b7178b35b/global_step84877/layer_15-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:36f30308ff40990a281579c18483513788f3699af71c02f514340f5d618af624 +size 201408771 diff --git a/8b7178b35b/global_step84877/layer_16-model_00-model_states.pt b/8b7178b35b/global_step84877/layer_16-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e64d59acecdb251ad164d2a32e4f251e6b1d24c --- /dev/null +++ b/8b7178b35b/global_step84877/layer_16-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4858203e325bb3367f4f21599e862da68c76691b93f7397f3d1d76752016dafb +size 201408771 diff --git a/8b7178b35b/global_step84877/layer_16-model_01-model_states.pt b/8b7178b35b/global_step84877/layer_16-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ad33f73b46bc311ae4e9f9886e54a086476463de --- /dev/null +++ b/8b7178b35b/global_step84877/layer_16-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4804106bb2a9622644a7ddcd204145f1185c63932451236ab94e09091070de37 +size 201408771 diff --git a/8b7178b35b/global_step84877/layer_17-model_00-model_states.pt b/8b7178b35b/global_step84877/layer_17-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dd7e4b546f03797ff500a3756a8d8321ff73bd7f --- /dev/null +++ b/8b7178b35b/global_step84877/layer_17-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:43196525360a6e4b2f1234ed476bc3d9086a34802c777ea8121fbfd0e49e6d79 +size 201408771 diff --git a/8b7178b35b/global_step84877/layer_17-model_01-model_states.pt b/8b7178b35b/global_step84877/layer_17-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..737a7f00f268a8703b210f1dc4032586400feb03 --- /dev/null +++ b/8b7178b35b/global_step84877/layer_17-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:636db2d2e1b9c74cab8a7c2481c145b31f8b0860578c48e988312872acd9aaee +size 201408771 diff --git a/8b7178b35b/global_step84877/layer_18-model_00-model_states.pt b/8b7178b35b/global_step84877/layer_18-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1a0dc6e65ef59feaceb01971d757937d3651fc0b --- /dev/null +++ b/8b7178b35b/global_step84877/layer_18-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:743e87149bb6bf5ba993a74a9d1a8dd070aea167f1339b8cafee51e7696b873b +size 201408771 diff --git a/8b7178b35b/global_step84877/layer_18-model_01-model_states.pt b/8b7178b35b/global_step84877/layer_18-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8842efea328fe728558e4a9b4a7d5cb7ae3319e3 --- /dev/null +++ b/8b7178b35b/global_step84877/layer_18-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:52f618db048d1ce9340ef5de60a69f56a7be5139c06ca1a25ccf70de22c49c05 +size 201408771 diff --git a/8b7178b35b/global_step84877/layer_19-model_00-model_states.pt b/8b7178b35b/global_step84877/layer_19-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c9d649e369cb4a14b7c1d6549bc282da24fdb353 --- /dev/null +++ b/8b7178b35b/global_step84877/layer_19-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b35a006caf01468c6fe4bc17ef83872003720fa7e9c4cabe854b12391748efce +size 201408771 diff --git a/8b7178b35b/global_step84877/layer_19-model_01-model_states.pt b/8b7178b35b/global_step84877/layer_19-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a98db5840cffd6bf6b8da4ad54c47c956ae8c1dd --- /dev/null +++ b/8b7178b35b/global_step84877/layer_19-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c67d9f8291365aab482ba2ebfeb5afc57830b8d382172d25ebbb6f24e334e7b5 +size 201408771 diff --git a/8b7178b35b/global_step84877/layer_20-model_00-model_states.pt b/8b7178b35b/global_step84877/layer_20-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..42fe30603765b1475cae088def832a8b52dfe556 --- /dev/null +++ b/8b7178b35b/global_step84877/layer_20-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1bcdb4b864c38fa9ca45a746765cc1446d5d2ff6e1e18fe087144b7664ede4e7 +size 201408771 diff --git a/8b7178b35b/global_step84877/layer_20-model_01-model_states.pt b/8b7178b35b/global_step84877/layer_20-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..03ec82f869d1ffb5641c813437f2b7dd82cd8c3e --- /dev/null +++ b/8b7178b35b/global_step84877/layer_20-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c057d613cedf0ce34722ac2fc828d761352057b6cc83a2acaf4e1f0bee37c4ba +size 201408771 diff --git a/8b7178b35b/global_step84877/layer_21-model_00-model_states.pt b/8b7178b35b/global_step84877/layer_21-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..11fdd75087138d9ee0efa1071cc941e206c8f8f4 --- /dev/null +++ b/8b7178b35b/global_step84877/layer_21-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dde609c2d0ad35a7f13b46ed15583826f4d30c5f29c7c35dc585c27c75585429 +size 201408771 diff --git a/8b7178b35b/global_step84877/layer_21-model_01-model_states.pt b/8b7178b35b/global_step84877/layer_21-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..23923bcc4db61fc05ccc8d04a97b0a9903e399de --- /dev/null +++ b/8b7178b35b/global_step84877/layer_21-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74192411efd0b7865f13a4cfbb275eed49fa3951978f54b0c2bfcc728cfd764b +size 201408771 diff --git a/8b7178b35b/global_step84877/layer_22-model_00-model_states.pt b/8b7178b35b/global_step84877/layer_22-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..aadbf029f985d7d4e261ce98e7de741579294759 --- /dev/null +++ b/8b7178b35b/global_step84877/layer_22-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b7bbaebd2ea6dd00d12db84935f927dffbc3c9d874556b2464e3427c3d40b10 +size 201408771 diff --git a/8b7178b35b/global_step84877/layer_22-model_01-model_states.pt b/8b7178b35b/global_step84877/layer_22-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fe5eb428af3bcfa1da56c09cbe2e04d0ad76a5da --- /dev/null +++ b/8b7178b35b/global_step84877/layer_22-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a4962e933814c0dfcc881709303ab24e898029d2df9f857d226884f29dc779f1 +size 201408771 diff --git a/8b7178b35b/global_step84877/layer_23-model_00-model_states.pt b/8b7178b35b/global_step84877/layer_23-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9224afe5d03dfe6f2cd285d46326568c6c8a8dc5 --- /dev/null +++ b/8b7178b35b/global_step84877/layer_23-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:954dcd3826502b07a15d8c04ce4ce3fbb15273ba11775423cabaa55327eccafe +size 201408771 diff --git a/8b7178b35b/global_step84877/layer_23-model_01-model_states.pt b/8b7178b35b/global_step84877/layer_23-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..da0a524baa77d4f370c1aecc0a8aaa5408748a0f --- /dev/null +++ b/8b7178b35b/global_step84877/layer_23-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b79b247228b5e5745d143bdfcebd40d749e31cf7ab01879b4d42c62bfa4a7d9e +size 201408771 diff --git a/8b7178b35b/global_step84877/layer_24-model_00-model_states.pt b/8b7178b35b/global_step84877/layer_24-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4c4a837a6a190ded64655cf370fa12fddd3975b4 --- /dev/null +++ b/8b7178b35b/global_step84877/layer_24-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3787c8d3443ed08581a827341b09672d8737b34b66b6dd9aca77b07192ead693 +size 201408771 diff --git a/8b7178b35b/global_step84877/layer_24-model_01-model_states.pt b/8b7178b35b/global_step84877/layer_24-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4c13cc71b17376655a7a610e845bd8e332c09f7e --- /dev/null +++ b/8b7178b35b/global_step84877/layer_24-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a44fd0155b7f4a06c33315e8e4e858c0489d84f44515e58acf9f29468ba874e +size 201408771 diff --git a/8b7178b35b/global_step84877/layer_25-model_00-model_states.pt b/8b7178b35b/global_step84877/layer_25-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..03c0f5fe98366fbe2c500fc2714af8b7b182a1cf --- /dev/null +++ b/8b7178b35b/global_step84877/layer_25-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c9b50a2c542b393e83b4875ea5b048d8a7c626dc96752250584ae1a11a9d20fb +size 201408771 diff --git a/8b7178b35b/global_step84877/layer_25-model_01-model_states.pt b/8b7178b35b/global_step84877/layer_25-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..90c7321f3d208525270d2990d6bf3fee8c2f1c9a --- /dev/null +++ b/8b7178b35b/global_step84877/layer_25-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0aca632298f8b43a70b0c86f422ec63bda82d0281513c0f0e0cfac8a51eadeec +size 201408771 diff --git a/8b7178b35b/global_step84877/layer_26-model_00-model_states.pt b/8b7178b35b/global_step84877/layer_26-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..49f0330c2d6758397c1373377939e102e54872ea --- /dev/null +++ b/8b7178b35b/global_step84877/layer_26-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:445ea5ff44e977a690c8a18005e695131b3138247414de83e34eb534e7122fb9 +size 201408771 diff --git a/8b7178b35b/global_step84877/layer_26-model_01-model_states.pt b/8b7178b35b/global_step84877/layer_26-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..953563563db50c1c5eb932c95f7ebad16d73c670 --- /dev/null +++ b/8b7178b35b/global_step84877/layer_26-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:571e869d287df333efdcf546cfc0a1fccc71963879e5c0cbf0940f4e50842dc1 +size 201408771 diff --git a/8b7178b35b/global_step84877/layer_27-model_00-model_states.pt b/8b7178b35b/global_step84877/layer_27-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c3619650f9d3b4505684ea11612fa8afada8e596 --- /dev/null +++ b/8b7178b35b/global_step84877/layer_27-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ed8b84c5dbc06e728a6ddbc2e254152b34898468a2f210ce8089e7e2deb1e28 +size 201408771 diff --git a/8b7178b35b/global_step84877/layer_27-model_01-model_states.pt b/8b7178b35b/global_step84877/layer_27-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..87c97e9f681947705d14693fe5454fd11bbdaa33 --- /dev/null +++ b/8b7178b35b/global_step84877/layer_27-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f2cb8645ea4f80241171016848fa8c43aa6acd015f35afa61bf3dee07bb0444 +size 201408771 diff --git a/8b7178b35b/global_step84877/layer_28-model_00-model_states.pt b/8b7178b35b/global_step84877/layer_28-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1b9e49b34ae0937f8b79e26a4ad79c68a733c64d --- /dev/null +++ b/8b7178b35b/global_step84877/layer_28-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a3997cc0ce69887af5ca35baaaa4443ebeb1d6d67ec34d31332044db36d4beb +size 201408771 diff --git a/8b7178b35b/global_step84877/layer_28-model_01-model_states.pt b/8b7178b35b/global_step84877/layer_28-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5cd47526c614f99909dc5e9d6023ad081cf8812d --- /dev/null +++ b/8b7178b35b/global_step84877/layer_28-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f50cf4fec1198dbb980e21d065d79015482731adef4af3445220111bfc13d02c +size 201408771 diff --git a/8b7178b35b/global_step84877/layer_29-model_00-model_states.pt b/8b7178b35b/global_step84877/layer_29-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5bf350f582bafc5e231bef040c56604d2e9e9856 --- /dev/null +++ b/8b7178b35b/global_step84877/layer_29-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:423a58fce8c45385c0a390fed79453213744e23c5914c1908e2f9d763ea0d26f +size 201408771 diff --git a/8b7178b35b/global_step84877/layer_29-model_01-model_states.pt b/8b7178b35b/global_step84877/layer_29-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..04a8775da2ef810c5011cd931dd29383bb4b95f6 --- /dev/null +++ b/8b7178b35b/global_step84877/layer_29-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ffaacd97285a7958bf32ae706c9841b9d79aa04b35c7eea8f2d96fde2513f10c +size 201408771 diff --git a/8b7178b35b/global_step84877/layer_30-model_00-model_states.pt b/8b7178b35b/global_step84877/layer_30-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0da5f78e68a029c1a5c0c4be867880de581b05a6 --- /dev/null +++ b/8b7178b35b/global_step84877/layer_30-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e30baea869db1e40a0fd2c333c8ab2c17f60d56b0195cd236dd6cc3cafc0c36b +size 201408771 diff --git a/8b7178b35b/global_step84877/layer_30-model_01-model_states.pt b/8b7178b35b/global_step84877/layer_30-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f58d0dc4360fb687671414bd21120e15c3688cf2 --- /dev/null +++ b/8b7178b35b/global_step84877/layer_30-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3153ca9a007816506664f07f7ced7dd8f3b41138b4b0f9ec8ee69426b07291ff +size 201408771 diff --git a/8b7178b35b/global_step84877/layer_31-model_00-model_states.pt b/8b7178b35b/global_step84877/layer_31-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cdaad12c805498da7e8173957b7910a0dc771f40 --- /dev/null +++ b/8b7178b35b/global_step84877/layer_31-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:046076e508e33c8a5402a204a05f8622f3c362ee429320ab88a00f968046437f +size 201408771 diff --git a/8b7178b35b/global_step84877/layer_31-model_01-model_states.pt b/8b7178b35b/global_step84877/layer_31-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..597e22bc34244a929e57b58bc509b4175e21da14 --- /dev/null +++ b/8b7178b35b/global_step84877/layer_31-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:257f1a1086051beefd531900240aa24afad8ff28c2694d45fc3a5d76eb983b30 +size 201408771 diff --git a/8b7178b35b/global_step84877/layer_32-model_00-model_states.pt b/8b7178b35b/global_step84877/layer_32-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8331648c402fed0d60418e56d7f2c503f93f42a9 --- /dev/null +++ b/8b7178b35b/global_step84877/layer_32-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2452d98637833d54fea917437441333cd70034505a7059e44e70b1e0310d3203 +size 201408771 diff --git a/8b7178b35b/global_step84877/layer_32-model_01-model_states.pt b/8b7178b35b/global_step84877/layer_32-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4bfd76afbf6f3b30e68dd0f69240d33002c16362 --- /dev/null +++ b/8b7178b35b/global_step84877/layer_32-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb30af4e244e27405ed61835dafe0a61e117c8243fc6c4f60a15bc918045df0c +size 201408771 diff --git a/8b7178b35b/global_step84877/layer_33-model_00-model_states.pt b/8b7178b35b/global_step84877/layer_33-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..49e0d2af77897f439af31dac279c05a138caf558 --- /dev/null +++ b/8b7178b35b/global_step84877/layer_33-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0234c6c37b2edb61c8943d4770a8cacbc1c88f0d52851394e60e2feb82785e65 +size 201408771 diff --git a/8b7178b35b/global_step84877/layer_33-model_01-model_states.pt b/8b7178b35b/global_step84877/layer_33-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cce81b4668dac1916ce22b532f6369e293de929c --- /dev/null +++ b/8b7178b35b/global_step84877/layer_33-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a222ad5fd72032c6fc47eecb4e5b08615e56f723319e93dfba6abbe830afc55 +size 201408771 diff --git a/8b7178b35b/global_step84877/layer_34-model_00-model_states.pt b/8b7178b35b/global_step84877/layer_34-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3e6aeb48ef1eec4afcd29c05a8cd92ed98c56040 --- /dev/null +++ b/8b7178b35b/global_step84877/layer_34-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b3d7c8e5278b874f74f05b1c152b0a36115e787357dc019fbcc1aa41ebb3c24 +size 201408771 diff --git a/8b7178b35b/global_step84877/layer_34-model_01-model_states.pt b/8b7178b35b/global_step84877/layer_34-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..712f90edffcc08d4eff2c8b779cb32d726fda709 --- /dev/null +++ b/8b7178b35b/global_step84877/layer_34-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa495a68d3625980a56b1277b76fd5b735b4373493453a594a90343e03a5c95a +size 201408771 diff --git a/8b7178b35b/global_step84877/layer_35-model_00-model_states.pt b/8b7178b35b/global_step84877/layer_35-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..922fef209f7925e67b6f2f5462c502302eed95f1 --- /dev/null +++ b/8b7178b35b/global_step84877/layer_35-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c1ff57cde9dfd07d14361141d284e6712ef04f92bbdf15804a0524746ea9b57 +size 201408771 diff --git a/8b7178b35b/global_step84877/layer_35-model_01-model_states.pt b/8b7178b35b/global_step84877/layer_35-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bba869bee1e8b29f507e144b4bc8af31c9a42fd7 --- /dev/null +++ b/8b7178b35b/global_step84877/layer_35-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8322ba5dc186d30ff442064f1e08d017f5a8682669515f2c3346d89afad2f9c +size 201408771 diff --git a/8b7178b35b/global_step84877/layer_36-model_00-model_states.pt b/8b7178b35b/global_step84877/layer_36-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..31dde0348e329f31319b5bdeb6c3be19fb591e3d --- /dev/null +++ b/8b7178b35b/global_step84877/layer_36-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:210e8666285ab954e7da2affcba0b3984ee7c8025c6295d98e0ad48a6611d125 +size 201408771 diff --git a/8b7178b35b/global_step84877/layer_36-model_01-model_states.pt b/8b7178b35b/global_step84877/layer_36-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..39554e1cac1be30d842a5b7e01c449f2e2972c54 --- /dev/null +++ b/8b7178b35b/global_step84877/layer_36-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b30213d8b7a6c62e89280df14f4341a943a868f150ba19822fd44e17d444e4d9 +size 201408771 diff --git a/8b7178b35b/global_step84877/layer_37-model_00-model_states.pt b/8b7178b35b/global_step84877/layer_37-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8f53c229e8ec741be3d047f1a4f0a657625d4f87 --- /dev/null +++ b/8b7178b35b/global_step84877/layer_37-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed19d1df104840d96e420adf72330da16ea0f2aee5bbed0f3c6dbed34bc1a130 +size 201408771 diff --git a/8b7178b35b/global_step84877/layer_37-model_01-model_states.pt b/8b7178b35b/global_step84877/layer_37-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e14b23ac9b1559612535e6bb0acf64e936177e67 --- /dev/null +++ b/8b7178b35b/global_step84877/layer_37-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9548b0626c4e7613cdc498f1a850a88f23d8dcdebafeae88da9aaac5c48d923d +size 201408771 diff --git a/8b7178b35b/global_step84877/layer_38-model_00-model_states.pt b/8b7178b35b/global_step84877/layer_38-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bbfcd79decc7b792a5da374bd7f9ecfa56844883 --- /dev/null +++ b/8b7178b35b/global_step84877/layer_38-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d26262123a72ca5c525c15c09f101e52fdec6fb600c4462dfccbe7716f9674f7 +size 201408771 diff --git a/8b7178b35b/global_step84877/layer_38-model_01-model_states.pt b/8b7178b35b/global_step84877/layer_38-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..046627c995c87f002969e419827d2f1dd9443184 --- /dev/null +++ b/8b7178b35b/global_step84877/layer_38-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:53d84824234fa6ad8ba10f857a2b7c87bcc221ad75bca54c663c13e8bf4f73ae +size 201408771 diff --git a/8b7178b35b/global_step84877/layer_39-model_00-model_states.pt b/8b7178b35b/global_step84877/layer_39-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cb12b9a31dde89ce1e119f6691e2f07461cd9a25 --- /dev/null +++ b/8b7178b35b/global_step84877/layer_39-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2cc6416ecd437d8884cff319c8792102e4ac35e3b249b19578bd72a271765ffb +size 201408771 diff --git a/8b7178b35b/global_step84877/layer_39-model_01-model_states.pt b/8b7178b35b/global_step84877/layer_39-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5e4b6f1ed1d16ed18057dfdd5a29c24ec2f9a648 --- /dev/null +++ b/8b7178b35b/global_step84877/layer_39-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9bac8ad63c809220b39543ee8b464c1f8bfc13262ffe295cb9ffaaf4e4510744 +size 201408771 diff --git a/8b7178b35b/global_step84877/layer_40-model_00-model_states.pt b/8b7178b35b/global_step84877/layer_40-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c511fdb216c619b5560a3d271499619f3beceb84 --- /dev/null +++ b/8b7178b35b/global_step84877/layer_40-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c08fd7d4f1c28fada7405e28a50401acb7f365cb35dc3db946e3a7b4bca31e0 +size 201408771 diff --git a/8b7178b35b/global_step84877/layer_40-model_01-model_states.pt b/8b7178b35b/global_step84877/layer_40-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..36b9da34fde3c11f99da1d8b6b7ae26043bcde69 --- /dev/null +++ b/8b7178b35b/global_step84877/layer_40-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:801918f5ccd34e5ed44810f7096578142e694e936e8fbd3ec334ffd8d04b1707 +size 201408771 diff --git a/8b7178b35b/global_step84877/layer_41-model_00-model_states.pt b/8b7178b35b/global_step84877/layer_41-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a555d417ea59a7d17fafb1e01f11cc2bfe5f2e46 --- /dev/null +++ b/8b7178b35b/global_step84877/layer_41-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a43a8f93561cd95de80f4300ba769709f8c27118be4eccc4ff1cd2789e09015 +size 201408771 diff --git a/8b7178b35b/global_step84877/layer_41-model_01-model_states.pt b/8b7178b35b/global_step84877/layer_41-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c8210b16ec445a9f5d0ed30ffc432a2ab3e81f89 --- /dev/null +++ b/8b7178b35b/global_step84877/layer_41-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b0e44e0cfa37a453a4f575116c54dc7f5bd6f33ebc1e53781d1a71c3a6ad7b1 +size 201408771 diff --git a/8b7178b35b/global_step84877/layer_42-model_00-model_states.pt b/8b7178b35b/global_step84877/layer_42-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9441ddb1611d9f7177185eb49e531138da60e3fd --- /dev/null +++ b/8b7178b35b/global_step84877/layer_42-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e63822650749a8feba1c1fc204a63fa9b923d3c761e47a79d5d554c0766002e +size 201408771 diff --git a/8b7178b35b/global_step84877/layer_42-model_01-model_states.pt b/8b7178b35b/global_step84877/layer_42-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bcd3d5ce700ad69811f4c1ff64ef6b962da3d021 --- /dev/null +++ b/8b7178b35b/global_step84877/layer_42-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:56962a46d5aa4a10a2a354e5a5358ddfa3587d314d47196514034c83d9f364b2 +size 201408771 diff --git a/8b7178b35b/global_step84877/layer_43-model_00-model_states.pt b/8b7178b35b/global_step84877/layer_43-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b7501ca730a558820c8ac312ed976622bb002fbe --- /dev/null +++ b/8b7178b35b/global_step84877/layer_43-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b6cb4f2cac44c8ba1a02f7c68958d49b0b5669b91b05d3e204bfdb27b1c38c3 +size 201408771 diff --git a/8b7178b35b/global_step84877/layer_43-model_01-model_states.pt b/8b7178b35b/global_step84877/layer_43-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..77eb003241832a22efe04a4646406ef80d5b74ea --- /dev/null +++ b/8b7178b35b/global_step84877/layer_43-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf57d48b88059a62c01edf3c2d6906330094297ec1df56451b45f79926e95384 +size 201408771 diff --git a/8b7178b35b/global_step84877/layer_44-model_00-model_states.pt b/8b7178b35b/global_step84877/layer_44-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..47e380ba38643556855396e40bdc2d0c7a11f045 --- /dev/null +++ b/8b7178b35b/global_step84877/layer_44-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb7648743a419aeb69158ab6ee2da9b07a5a08eb57dad9ac25ef6d8b9720b610 +size 201408771 diff --git a/8b7178b35b/global_step84877/layer_44-model_01-model_states.pt b/8b7178b35b/global_step84877/layer_44-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ab052c722fddc586f67daa12fa26085b876b1c96 --- /dev/null +++ b/8b7178b35b/global_step84877/layer_44-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ff812861635ed6881361b32523640fdf22a9bae1ba44b4a042bc7f3617311f4 +size 201408771 diff --git a/8b7178b35b/global_step84877/layer_46-model_00-model_states.pt b/8b7178b35b/global_step84877/layer_46-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b235d3b7d1f6ec92492b8341b463a9f55c1983dc --- /dev/null +++ b/8b7178b35b/global_step84877/layer_46-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a4f66ccccef2635816844c0fa9b1b9787b757e4daa16b5769c5c4ed7c73566da +size 17603 diff --git a/8b7178b35b/global_step84877/layer_46-model_01-model_states.pt b/8b7178b35b/global_step84877/layer_46-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..961aaffcfc8cf8d2704eca629fc3301864c21505 --- /dev/null +++ b/8b7178b35b/global_step84877/layer_46-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9ae14fb8eade996358f158aeb88a8b74edbded38ede83bfaa9c641fe6c12be4 +size 17603 diff --git a/8b7178b35b/global_step84877/mp_rank_00_model_states.pt b/8b7178b35b/global_step84877/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6bb1304cadd1354b34a294727d9cc0013feffd98 --- /dev/null +++ b/8b7178b35b/global_step84877/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c04d95b378249516a1803c108ff03b30134c7d8376ed1b15ac81cc77fe5bf75 +size 40115 diff --git a/8b7178b35b/global_step84877/mp_rank_01_model_states.pt b/8b7178b35b/global_step84877/mp_rank_01_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..17db636e5d894f8a10be69c728d5a6c0ca28f24d --- /dev/null +++ b/8b7178b35b/global_step84877/mp_rank_01_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca1dc96abe1203ed2ec81fff85c8af588b2296dd137a358cecfaa39e88022c3c +size 40115 diff --git a/8b7178b35b/global_step84877/mp_rank_02_model_states.pt b/8b7178b35b/global_step84877/mp_rank_02_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..557529112c089b38b6f378639f2953f2ea0b7b4a --- /dev/null +++ b/8b7178b35b/global_step84877/mp_rank_02_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e0ead56722ebaac41bd8fd697ed86390440faba63dbf0b0aadd1629c347fc6ad +size 40243 diff --git a/8b7178b35b/global_step84877/mp_rank_03_model_states.pt b/8b7178b35b/global_step84877/mp_rank_03_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ae92f74a8dc31a3d1c0e88d2d6717f06e756edc2 --- /dev/null +++ b/8b7178b35b/global_step84877/mp_rank_03_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad87d0566dfdbe5c0af8425d58ddc7c2c8948370946af1cf2399f8938dda8a30 +size 40243 diff --git a/8b7178b35b/transformers/config.json b/8b7178b35b/transformers/config.json new file mode 100644 index 0000000000000000000000000000000000000000..eadf3eb13cecae9db1c34cde4f4d373a9d0fe00f --- /dev/null +++ b/8b7178b35b/transformers/config.json @@ -0,0 +1 @@ +{"vocab_size": 50432, "n_positions": 2048, "n_embd": 4096, "n_layer": 42, "n_head": 32, "n_inner": 16384, "activation_function": "gelu", "resid_pdrop": 0.1, "embd_pdrop": 0.1, "attn_pdrop": 0.1, "layer_norm_epsilon": 1e-05, "initializer_range": 0.02, "summary_type": "cls_index", "summary_use_proj": true, "summary_activation": null, "summary_first_dropout": 0.1, "summary_proj_to_labels": true, "scale_attn_weights": true, "use_cache": true, "scale_attn_by_inverse_layer_idx": false, "reorder_and_upcast_attn": false, "bos_token_id": 50256, "eos_token_id": 50256, "return_dict": true, "output_hidden_states": false, "output_attentions": false, "torchscript": false, "torch_dtype": null, "use_bfloat16": false, "tf_legacy_loss": false, "pruned_heads": {}, "tie_word_embeddings": true, "is_encoder_decoder": false, "is_decoder": false, "cross_attention_hidden_size": null, "add_cross_attention": false, "tie_encoder_decoder": false, "max_length": 20, "min_length": 0, "do_sample": false, "early_stopping": false, "num_beams": 1, "num_beam_groups": 1, "diversity_penalty": 0.0, "temperature": 1.0, "top_k": 50, "top_p": 1.0, "typical_p": 1.0, "repetition_penalty": 1.0, "length_penalty": 1.0, "no_repeat_ngram_size": 0, "encoder_no_repeat_ngram_size": 0, "bad_words_ids": null, "num_return_sequences": 1, "chunk_size_feed_forward": 0, "output_scores": false, "return_dict_in_generate": false, "forced_bos_token_id": null, "forced_eos_token_id": null, "remove_invalid_values": false, "exponential_decay_length_penalty": null, "suppress_tokens": null, "begin_suppress_tokens": null, "architectures": ["GPT2LMHeadModel"], "finetuning_task": null, "id2label": {"0": "LABEL_0", "1": "LABEL_1"}, "label2id": {"LABEL_0": 0, "LABEL_1": 1}, "tokenizer_class": null, "prefix": null, "pad_token_id": null, "sep_token_id": null, "decoder_start_token_id": null, "task_specific_params": null, "problem_type": null, "_name_or_path": "", "transformers_version": "4.25.0.dev0", "n_ctx": 1024, "gradient_checkpointing": false, "model_type": "gpt2"} \ No newline at end of file diff --git a/8b7178b35b/transformers/pytorch_model.bin b/8b7178b35b/transformers/pytorch_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..cace2b6b70c66046eeaed1c912e71f98b9473b5d --- /dev/null +++ b/8b7178b35b/transformers/pytorch_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1829c16592c505ba768372f80f01072f569e00ef6dfc52eff56354e240300a93 +size 17698351197 diff --git a/tensorboard/tensorboard_8b7178b35boscar/events.out.tfevents.1674203794.nid007146.119013.0 b/tensorboard/tensorboard_8b7178b35boscar/events.out.tfevents.1674203794.nid007146.119013.0 new file mode 100644 index 0000000000000000000000000000000000000000..d52dd9f80ac4adf5669eb4e10150e0890dc5e7f6 --- /dev/null +++ b/tensorboard/tensorboard_8b7178b35boscar/events.out.tfevents.1674203794.nid007146.119013.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3142df51530074a69a577e7084dae0ba37f4648799aba4a0c65823d1ab5b7225 +size 26134685 diff --git a/tensorboard/tensorboard_8b7178b35boscar/events.out.tfevents.1674376515.nid006305.56293.0 b/tensorboard/tensorboard_8b7178b35boscar/events.out.tfevents.1674376515.nid006305.56293.0 new file mode 100644 index 0000000000000000000000000000000000000000..1dfa508bf271644bd52c2151eecced0bf6b8b4a6 --- /dev/null +++ b/tensorboard/tensorboard_8b7178b35boscar/events.out.tfevents.1674376515.nid006305.56293.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:330af17e1b7d64d46e728d420845a79621a1fd2af4a8a9b837496ae41c5f48f3 +size 55923526 diff --git a/tensorboard/tensorboard_8b7178b35boscar/events.out.tfevents.1674549472.nid007079.71773.0 b/tensorboard/tensorboard_8b7178b35boscar/events.out.tfevents.1674549472.nid007079.71773.0 new file mode 100644 index 0000000000000000000000000000000000000000..d2a8fd437b7b03d2e163d135c0c779f27d032402 --- /dev/null +++ b/tensorboard/tensorboard_8b7178b35boscar/events.out.tfevents.1674549472.nid007079.71773.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:72e12379ac3b755c01d08983bc56d0f856b2dc39b67c28b24093b6e651a1d357 +size 39144552 diff --git a/tensorboard/tensorboard_8b7178b35boscar/events.out.tfevents.1674723078.nid005411.54504.0 b/tensorboard/tensorboard_8b7178b35boscar/events.out.tfevents.1674723078.nid005411.54504.0 new file mode 100644 index 0000000000000000000000000000000000000000..f7bfb08ddfb521941ec8ab06f83adf1b1e20234f --- /dev/null +++ b/tensorboard/tensorboard_8b7178b35boscar/events.out.tfevents.1674723078.nid005411.54504.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce0f30d5a9056ae8bf71ee5229c77ff793c6991f6ba59b8b238fdf7623f6c5bf +size 40 diff --git a/tensorboard/tensorboard_8b7178b35boscar/events.out.tfevents.1674725409.nid007121.9656.0 b/tensorboard/tensorboard_8b7178b35boscar/events.out.tfevents.1674725409.nid007121.9656.0 new file mode 100644 index 0000000000000000000000000000000000000000..0788de1166afbf64454fa327c8f1b339c61ca55a --- /dev/null +++ b/tensorboard/tensorboard_8b7178b35boscar/events.out.tfevents.1674725409.nid007121.9656.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:42c6700557591fd75df97080d903069499993ed14dbde7716ee63cbe105559a1 +size 40 diff --git a/tensorboard/tensorboard_8b7178b35boscar/events.out.tfevents.1674728989.nid005736.38427.0 b/tensorboard/tensorboard_8b7178b35boscar/events.out.tfevents.1674728989.nid005736.38427.0 new file mode 100644 index 0000000000000000000000000000000000000000..663e1b8b59a5e12ac171789012b38ef7aaf47044 --- /dev/null +++ b/tensorboard/tensorboard_8b7178b35boscar/events.out.tfevents.1674728989.nid005736.38427.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5291ef48de6a68f22880561c1e38f2dfd50890bcb6118ce8607f70f1acd6da07 +size 40 diff --git a/tensorboard/tensorboard_8b7178b35boscar/events.out.tfevents.1674910948.nid007079.57589.0 b/tensorboard/tensorboard_8b7178b35boscar/events.out.tfevents.1674910948.nid007079.57589.0 new file mode 100644 index 0000000000000000000000000000000000000000..3121bcd4d93a5a86d4b099fde745f7c4cbef55d4 --- /dev/null +++ b/tensorboard/tensorboard_8b7178b35boscar/events.out.tfevents.1674910948.nid007079.57589.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:36038f9b26b544d7992449535dece63840ca292283c4e40a0b1a53bea449b620 +size 12268610 diff --git a/tensorboard/tensorboard_8b7178b35boscar/events.out.tfevents.1675083632.nid007191.27138.0 b/tensorboard/tensorboard_8b7178b35boscar/events.out.tfevents.1675083632.nid007191.27138.0 new file mode 100644 index 0000000000000000000000000000000000000000..80cc66a05b2e6054039cb6f3b16ced65690725c5 --- /dev/null +++ b/tensorboard/tensorboard_8b7178b35boscar/events.out.tfevents.1675083632.nid007191.27138.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ba60d940c7e7d747facf257bd71ae2e8b02750ac754538706cc788f661d9a87 +size 27223434 diff --git a/tensorboard/tensorboard_8b7178b35boscar/events.out.tfevents.1675183786.nid005239.113088.0 b/tensorboard/tensorboard_8b7178b35boscar/events.out.tfevents.1675183786.nid005239.113088.0 new file mode 100644 index 0000000000000000000000000000000000000000..71f360ceca69c952e4d979d759221af7674ce153 --- /dev/null +++ b/tensorboard/tensorboard_8b7178b35boscar/events.out.tfevents.1675183786.nid005239.113088.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d8259064eb6b6b7492f0cfb5287a0eea4088e3379fb61788d8d941695e13997b +size 40 diff --git a/tensorboard/tensorboard_8b7178b35boscar/events.out.tfevents.1675184263.nid006012.17098.0 b/tensorboard/tensorboard_8b7178b35boscar/events.out.tfevents.1675184263.nid006012.17098.0 new file mode 100644 index 0000000000000000000000000000000000000000..a6eaa0ba060c3647841765df8b71181c16182aa4 --- /dev/null +++ b/tensorboard/tensorboard_8b7178b35boscar/events.out.tfevents.1675184263.nid006012.17098.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e81caeeda0d9aa5f2b1f85f383a9a35d2356341df732689f45f1188b7296f4b +size 8794719 diff --git a/tensorboard/tensorboard_8b7178b35boscar/events.out.tfevents.1675212724.nid006461.5702.0 b/tensorboard/tensorboard_8b7178b35boscar/events.out.tfevents.1675212724.nid006461.5702.0 new file mode 100644 index 0000000000000000000000000000000000000000..526e8cd5b41798485aeb7c882e4763c651d93580 --- /dev/null +++ b/tensorboard/tensorboard_8b7178b35boscar/events.out.tfevents.1675212724.nid006461.5702.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aba9e9d928c43406f13d6b9f9e8a4797b5e85ffc96b764f5ca1d654782b4b612 +size 22609