diff --git a/4b284b21bc4seed1/evaluation/generation/agg.4b284b21bc4seed1_GEM-web_nlg_en_PALM_prompt_0.json b/4b284b21bc4seed1/evaluation/generation/agg.4b284b21bc4seed1_GEM-web_nlg_en_PALM_prompt_0.json new file mode 100644 index 0000000000000000000000000000000000000000..216f7366761d492626bc642c592e10ca81f43470 --- /dev/null +++ b/4b284b21bc4seed1/evaluation/generation/agg.4b284b21bc4seed1_GEM-web_nlg_en_PALM_prompt_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.33272479915628694, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.031796098410938015}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.06768598529946503, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.001826760753754374}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.273245918626827, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004811539102181524}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.09992028750901691, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002068624719484398}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.0319815601358353, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.001123592878248015}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.132780352400067, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0031651283586402535}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.047572357019245066, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0012754558397189623}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.06526863289287767, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.00173604911565671}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.2659429125520888, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004693559342531821}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.09656759025734364, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0019482031642887698}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.06475652685202478, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.001750562854208181}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.261555669425398, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004531537846674438}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.09550510540717662, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0019437957791240722}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b21bc4seed1/evaluation/generation/agg.4b284b21bc4seed1_GEM-web_nlg_en_PALM_prompt_1.json b/4b284b21bc4seed1/evaluation/generation/agg.4b284b21bc4seed1_GEM-web_nlg_en_PALM_prompt_1.json new file mode 100644 index 0000000000000000000000000000000000000000..2fa029c9056325b6501ddbd6b14c489cb0a32394 --- /dev/null +++ b/4b284b21bc4seed1/evaluation/generation/agg.4b284b21bc4seed1_GEM-web_nlg_en_PALM_prompt_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.5102447245370249, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.035376593830697835}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.07172631396783712, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0015940647947642393}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.3498874090683673, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.005494538712125141}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.11038438449277037, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0019607246874588217}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.03374360598633707, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0011472248278029387}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.17065910212771632, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0037615577096519314}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.0513340131604287, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0012161196627700137}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.06735170136224546, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0014692804169579693}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.32775015583004236, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.005027007036378035}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.10363295036370204, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0017764857744676573}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.06821168744641012, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0015257497030318006}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.3303827812174427, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.005034171208777432}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.10476642693447911, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.001844638754248624}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b21bc4seed1/evaluation/generation/agg.4b284b21bc4seed1_GEM-web_nlg_en_PALM_prompt_2.json b/4b284b21bc4seed1/evaluation/generation/agg.4b284b21bc4seed1_GEM-web_nlg_en_PALM_prompt_2.json new file mode 100644 index 0000000000000000000000000000000000000000..0df5375cd824e0876cef5fea133968f85f1224d3 --- /dev/null +++ b/4b284b21bc4seed1/evaluation/generation/agg.4b284b21bc4seed1_GEM-web_nlg_en_PALM_prompt_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.6028097084858823, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.03400607345942724}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.07447162662420612, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.001363119521612849}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.39133197093760397, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.005455286809780116}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.11747286047545925, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0018369017696682527}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.03418924065620199, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0008008890429324677}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.19324361036894205, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0038848529810624356}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.054159534529018366, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.00112831864459488}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.06854684035035577, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0012086804724451806}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.35968605242390533, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004868740565794037}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.10807779989120546, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.001612487862874725}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.0706586243525616, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0012889308612371538}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.36945068896305344, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0050409156545949945}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.11132296857949775, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0017256589790344656}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b21bc4seed1/evaluation/generation/agg.4b284b21bc4seed1_GEM-web_nlg_en_PALM_prompt_3.json b/4b284b21bc4seed1/evaluation/generation/agg.4b284b21bc4seed1_GEM-web_nlg_en_PALM_prompt_3.json new file mode 100644 index 0000000000000000000000000000000000000000..bb6987dbf4d9d34234b5fdef1c8486977cd9f3b4 --- /dev/null +++ b/4b284b21bc4seed1/evaluation/generation/agg.4b284b21bc4seed1_GEM-web_nlg_en_PALM_prompt_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.701781042691669, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.028304269361164428}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.07483297992459019, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0013297778153553014}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.40075245309368346, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.005510805436391809}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.1186720883935396, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0018557604964665015}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.03405829473639484, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0007867378650100502}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.1965036741041513, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0039013830928258273}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.05434522629151618, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0011369092672670533}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.06814102346988, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.001142595819228343}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.36375561641075393, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004784629751764729}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.10798420755086514, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.001585937192657532}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.0705542561432147, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0012322784221801353}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.376368921472397, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.005042206855487164}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.11180266475563037, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0017161756564434687}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b21bc4seed1/evaluation/generation/agg.4b284b21bc4seed1_GEM-web_nlg_en_PALM_prompt_4.json b/4b284b21bc4seed1/evaluation/generation/agg.4b284b21bc4seed1_GEM-web_nlg_en_PALM_prompt_4.json new file mode 100644 index 0000000000000000000000000000000000000000..562bafaf07d421c6451c3b4dfbea44b035ea8410 --- /dev/null +++ b/4b284b21bc4seed1/evaluation/generation/agg.4b284b21bc4seed1_GEM-web_nlg_en_PALM_prompt_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.7208477776174064, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.03611939053214278}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.07573522475977945, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0012828287982675156}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.4140707617730325, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.005500874400250013}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.12065545317279747, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0017878857789550631}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.03464259052791206, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0007595549203652654}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.20555557401100102, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.003919174647287531}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.05546852434740693, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.001093391566003447}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.06882833861974198, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.00110954922342777}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.37506782401870103, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004831464763832598}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.10954384971885704, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.001541389309718117}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.07144735748031365, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0011999248890901264}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.3887273820866732, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.005052183598911252}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.11373501038504552, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0016710119042870925}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b21bc4seed1/evaluation/generation/agg.4b284b21bc4seed1_GEM-web_nlg_en_PALM_prompt_5.json b/4b284b21bc4seed1/evaluation/generation/agg.4b284b21bc4seed1_GEM-web_nlg_en_PALM_prompt_5.json new file mode 100644 index 0000000000000000000000000000000000000000..5f1a14d71da3013d9f68cd450c26d929095f95ec --- /dev/null +++ b/4b284b21bc4seed1/evaluation/generation/agg.4b284b21bc4seed1_GEM-web_nlg_en_PALM_prompt_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.8098840843933562, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.042922709276963275}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.07551077098651218, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0011967463119907174}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.42778952645041607, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.005509208476502683}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.12112590895694009, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0016877211094516577}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.03488380229207791, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0007164646591878178}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.21683909270039745, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0040700970178128}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.05638496281385114, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0010526694616578302}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.06816852013471421, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0010570419074259674}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.3851255216729155, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004804722289936786}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.1091505948569381, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0014719382275165554}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.07111730496416463, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0011271521292987115}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.40225015185589585, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.005071744746719108}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.1139947508286874, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0015813085492093937}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b21bc4seed1/evaluation/generation/agg.4b284b21bc4seed1_GEM-wiki_lingua_en_tldr_en_0.json b/4b284b21bc4seed1/evaluation/generation/agg.4b284b21bc4seed1_GEM-wiki_lingua_en_tldr_en_0.json new file mode 100644 index 0000000000000000000000000000000000000000..6fdeb9c08eba501912ebc17abf07533fa84f3dae --- /dev/null +++ b/4b284b21bc4seed1/evaluation/generation/agg.4b284b21bc4seed1_GEM-wiki_lingua_en_tldr_en_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.15167532178589505, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0019073207185280718}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.2612333406333799, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0026793907173360246}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.17820031429089941, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.001867331386262004}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.03148570054286659, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0007720646786309003}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.05626578766960683, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0014278552081629383}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.03716728942279169, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0008623486309823396}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.116140614745089, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0013156638447678107}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.2083623246576857, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0021996516173952707}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.13833033412198834, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0013282918104537548}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.13994812048897234, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0017518520260318953}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.2422441673257693, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0024926109810662115}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.16463728733959723, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0017151648189316772}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 1.604770833205388, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.045152527476120426}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b21bc4seed1/evaluation/generation/agg.4b284b21bc4seed1_GEM-wiki_lingua_en_tldr_en_1.json b/4b284b21bc4seed1/evaluation/generation/agg.4b284b21bc4seed1_GEM-wiki_lingua_en_tldr_en_1.json new file mode 100644 index 0000000000000000000000000000000000000000..55aeba24b5157313c069941d64ebdc98b8653d36 --- /dev/null +++ b/4b284b21bc4seed1/evaluation/generation/agg.4b284b21bc4seed1_GEM-wiki_lingua_en_tldr_en_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.17995455895644027, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0021143646937022468}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.29822507703809786, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0029202005379262794}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.20675601444211894, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0019509220985923807}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.04280457785161096, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0010705605908791504}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.07256480707864589, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0016883207002489}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.0485299590695294, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.000987435381157907}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.128484042233791, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0014903515496972157}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.21893094707653085, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0022685657736807928}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.14838617751760952, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0013193585886492735}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.1682253075781992, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.001983258112076011}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.27945450640399006, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002751044005784169}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.19330419331545362, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.001817315871702104}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 2.3579628914986084, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.06443336501226987}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b21bc4seed1/evaluation/generation/agg.4b284b21bc4seed1_GEM-wiki_lingua_en_tldr_en_2.json b/4b284b21bc4seed1/evaluation/generation/agg.4b284b21bc4seed1_GEM-wiki_lingua_en_tldr_en_2.json new file mode 100644 index 0000000000000000000000000000000000000000..e16d0d4b4ff08e0e8a0b889d6f0b9ef875b8e86f --- /dev/null +++ b/4b284b21bc4seed1/evaluation/generation/agg.4b284b21bc4seed1_GEM-wiki_lingua_en_tldr_en_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.1942548807242778, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0023454682458510967}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.3038516433424921, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0028161999694894368}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.21447969004311607, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0018895718255246762}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.0492948803130678, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0011990391917610706}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.0782436349256461, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0017608820777292064}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.05328365330541802, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0010288709039921085}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.1390228041509367, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0017234767147472074}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.22270032621786837, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002252792096654515}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.15374474737766516, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0013038739578348723}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.18265776299811193, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0022101445170749252}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.28667373859931605, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002687218604461664}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.2018034121125251, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0017698133555769187}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 2.770701026929389, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.055755441860674826}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b21bc4seed1/evaluation/generation/agg.4b284b21bc4seed1_GEM-wiki_lingua_en_tldr_en_3.json b/4b284b21bc4seed1/evaluation/generation/agg.4b284b21bc4seed1_GEM-wiki_lingua_en_tldr_en_3.json new file mode 100644 index 0000000000000000000000000000000000000000..53ec1395e25241bc414bcf7155b540551fed1a61 --- /dev/null +++ b/4b284b21bc4seed1/evaluation/generation/agg.4b284b21bc4seed1_GEM-wiki_lingua_en_tldr_en_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.16605472663049203, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0026215736776626004}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.24674896622444079, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0032942062409122403}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.17584661717144687, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0022080154978502656}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.041252526415028114, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0012562811469129071}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.06385056201459363, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0017227611606126488}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.04324074407846396, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.001030508940585308}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.12107072019854664, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0020206323069935596}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.18199308221887076, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0025743010221870987}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.12719556123913905, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0015628923302645156}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.15696755228304862, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0025037796725520395}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.23345046038796602, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.003144339747645053}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.166023927031211, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0020868492894240698}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 2.6943492797886797, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.048945628141051856}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b21bc4seed1/evaluation/generation/agg.4b284b21bc4seed1_GEM-wiki_lingua_en_tldr_en_4.json b/4b284b21bc4seed1/evaluation/generation/agg.4b284b21bc4seed1_GEM-wiki_lingua_en_tldr_en_4.json new file mode 100644 index 0000000000000000000000000000000000000000..cbfa3d1c3275d40e975c5008187fe3bd16bfac2c --- /dev/null +++ b/4b284b21bc4seed1/evaluation/generation/agg.4b284b21bc4seed1_GEM-wiki_lingua_en_tldr_en_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.05342346190272065, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.002056550316894281}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.07978774494235341, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0028101467900972705}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.05454947380142532, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.001847757669359123}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.012258350990130428, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0007138900312061555}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.02028789716505487, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0011428305900431244}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.01286346881894465, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0006471740657104415}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.040366367324606266, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0016113191055682687}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.06061271598925825, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0021836846333784096}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.0407204750127799, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0013676744674585327}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.050133371793595845, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0019436034391785793}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.07473111376648439, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0026329914241005055}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.05108474776360767, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0017328648234254131}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 0.5943697556411244, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.030734589500314064}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b21bc4seed1/evaluation/generation/agg.4b284b21bc4seed1_GEM-wiki_lingua_en_tldr_en_5.json b/4b284b21bc4seed1/evaluation/generation/agg.4b284b21bc4seed1_GEM-wiki_lingua_en_tldr_en_5.json new file mode 100644 index 0000000000000000000000000000000000000000..8d5a7f6aab29feb5e5a3dd2cc1f33ab37a3299e8 --- /dev/null +++ b/4b284b21bc4seed1/evaluation/generation/agg.4b284b21bc4seed1_GEM-wiki_lingua_en_tldr_en_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.008364381665919872, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0008819285241796705}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.012634998947429131, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0012520411703047264}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.008385094317414335, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0007962608828602142}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.0019514480000772428, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0002950485643713033}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.0034586914827538628, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.000553626619531344}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.0020213111085609944, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0002694978086459766}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.006554032979312583, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0006990429427874044}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.010080116076976064, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0010433208473045565}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.006545584095103677, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0006266707040781551}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.007976144780102256, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0008419903349386873}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.012040227491122851, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.001201302499319246}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.007958529393460171, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0007541972102063722}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 1.5595918572619473e-06, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 2.8487471872210672e-06}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b21bc4seed1/evaluation/generation/agg.4b284b21bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_0.json b/4b284b21bc4seed1/evaluation/generation/agg.4b284b21bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_0.json new file mode 100644 index 0000000000000000000000000000000000000000..81e083a47947e173f01f1db40e5513332999023a --- /dev/null +++ b/4b284b21bc4seed1/evaluation/generation/agg.4b284b21bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 0.01599277764818925, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.004308927933825235}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.012870158730159176, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.00026604075009303314}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.02306192594226545, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0005060585834775515}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.016178489257483206, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0003336557540954231}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.00011382113821138212, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 3.0353975217624302e-05}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.00016007109878338666, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 4.471587603586543e-05}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.00012949433318118156, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 3.494334474550083e-05}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.012870158730159176, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.00026604075009303314}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.02306192594226545, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0005060585834775515}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.016178489257483206, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0003336557540954231}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.012401587301587743, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0002495014907480676}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.022186928253083223, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.00046927560289039864}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.015580467425438196, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0003114685494407546}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b21bc4seed1/evaluation/generation/agg.4b284b21bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_1.json b/4b284b21bc4seed1/evaluation/generation/agg.4b284b21bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_1.json new file mode 100644 index 0000000000000000000000000000000000000000..8fa8f6f5699ab0c826f6a66a21d34571a6e8d0cb --- /dev/null +++ b/4b284b21bc4seed1/evaluation/generation/agg.4b284b21bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 9.29730492833567, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.07258438562915104}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.4508609495206719, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0036311478842959532}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.4256279851535847, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002998743529748849}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.40179356473852385, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0024053635164423257}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.20803358909759323, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.002540052178876273}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.19234516196309973, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0021041392938787457}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.1821558520162302, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0018839477104031566}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.33647256551604726, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0029522675564527113}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.32133682780546957, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0025106371554624155}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.3001108360092531, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0019304143016397508}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.36851923372760476, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0033065014951933927}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.3458837990441542, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0027230707350231853}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.3272696975463691, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002280428848910135}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b21bc4seed1/evaluation/generation/agg.4b284b21bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_2.json b/4b284b21bc4seed1/evaluation/generation/agg.4b284b21bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_2.json new file mode 100644 index 0000000000000000000000000000000000000000..87055869b7a95795384480521c63da5135dca3f4 --- /dev/null +++ b/4b284b21bc4seed1/evaluation/generation/agg.4b284b21bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 12.759775802861823, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.1293139727386451}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.5296073064762413, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0033783994941725144}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.4363790698973518, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0029267544023528365}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.4496590978589395, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002303602978907222}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.25851059818334, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0026408591114483963}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.20978543572844377, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002146572930760848}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.2160790254378622, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.001955317829071995}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.39232032536879197, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0029964581011695346}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.3219131393183246, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0024670087975040625}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.33140579758047195, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0020369186351820263}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.4374911840880169, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0032563934045941744}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.35889049112539584, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0027163755824492135}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.3703216404379091, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0022909574817028392}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b21bc4seed1/evaluation/generation/agg.4b284b21bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_3.json b/4b284b21bc4seed1/evaluation/generation/agg.4b284b21bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_3.json new file mode 100644 index 0000000000000000000000000000000000000000..77b82b6887a2b0049eeb3eb2b6fbe4e509f48891 --- /dev/null +++ b/4b284b21bc4seed1/evaluation/generation/agg.4b284b21bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 13.39712229435215, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.2190368432916537}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.5434706515030117, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0032446983744738762}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.43747355273891847, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0028993863830845397}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.4585328203108971, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0022516911107973987}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.27356714226869305, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0026390580957758175}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.21639197788244496, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0021805025438367607}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.2270812503617402, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0019758386181450292}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.40618251147113754, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0029740816706799833}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.3236014788599963, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0024273522496127556}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.34028277436237736, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0020545641994681512}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.4532770963097311, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0031647100865919084}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.36298447462453876, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0026887391183781422}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.38125456908954924, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002257169022713513}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b21bc4seed1/evaluation/generation/agg.4b284b21bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_4.json b/4b284b21bc4seed1/evaluation/generation/agg.4b284b21bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_4.json new file mode 100644 index 0000000000000000000000000000000000000000..fdb9fb6e8dfafe6c07f93c8046751fc6587990e9 --- /dev/null +++ b/4b284b21bc4seed1/evaluation/generation/agg.4b284b21bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 13.278538903088437, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.19304270040523466}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.5550942770770999, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.00321920680863295}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.43254174724244665, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0027648654319805638}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.4614844218085089, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0021663747761732207}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.28123246363040955, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0027007119359494314}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.2150097554160261, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002138899675268787}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.22970482247017235, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.00197438239706358}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.4143281149202266, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.002969403717017417}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.32090483861163693, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0023977607834718777}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.3427415979760685, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0020357821149855123}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.46330716929389093, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0031399338067163917}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.3607474288264691, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002652994557246981}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.3847530991565415, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0022220842320301534}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b21bc4seed1/evaluation/generation/agg.4b284b21bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_5.json b/4b284b21bc4seed1/evaluation/generation/agg.4b284b21bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_5.json new file mode 100644 index 0000000000000000000000000000000000000000..d2c6d3faa58d5f526aa922119e6b4a723318cdfb --- /dev/null +++ b/4b284b21bc4seed1/evaluation/generation/agg.4b284b21bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 13.349674798491353, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.2620211666324464}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.5580977741060988, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.003152695337297477}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.4318929339624608, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0027232610944967796}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.46359996980874846, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0021412883557770652}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.282134536476671, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0026354539351566403}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.21417820926964778, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0020891541191163186}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.2303452786552104, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0019438168093482682}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.416156553657584, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.002921110787140179}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.3201090740050369, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0023555592018131553}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.34414481054807766, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0020332629423129916}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.46739254821741905, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0031264669970885233}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.3608544692904568, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0026213087830254975}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.38760985028639305, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002239740316941447}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b21bc4seed1/evaluation/generation/agg.4b284b21bc4seed1_gem_xsum_article_DOC_summary_0.json b/4b284b21bc4seed1/evaluation/generation/agg.4b284b21bc4seed1_gem_xsum_article_DOC_summary_0.json new file mode 100644 index 0000000000000000000000000000000000000000..fb7411ba4d0c13d1636758f87739c05da52681f6 --- /dev/null +++ b/4b284b21bc4seed1/evaluation/generation/agg.4b284b21bc4seed1_gem_xsum_article_DOC_summary_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.15826471323077757, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.002220888825623518}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.33446079519909305, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004514327805033082}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.20682985522235142, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002563714031203911}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.03352875592509948, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0012249216700579001}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.07724702868679346, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002831153557559276}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.04522961690526853, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0015798221742638174}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.1175738942721655, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0016420722284867819}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.2512371460248057, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.003517155084540941}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.1540627639559492, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0019062590295789597}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.12200871250100262, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0017899421156850875}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.26225586640138876, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0040169777118884645}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.16037094135484917, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0021767207134326364}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 1.8758881711718112, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.06414775170791744}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b21bc4seed1/evaluation/generation/agg.4b284b21bc4seed1_gem_xsum_article_DOC_summary_1.json b/4b284b21bc4seed1/evaluation/generation/agg.4b284b21bc4seed1_gem_xsum_article_DOC_summary_1.json new file mode 100644 index 0000000000000000000000000000000000000000..25a628b4f22657a9e25bcd638ef3f66c0abbc09f --- /dev/null +++ b/4b284b21bc4seed1/evaluation/generation/agg.4b284b21bc4seed1_gem_xsum_article_DOC_summary_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.12818817016431805, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0018328880795144842}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.3134061916653512, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004249929100773614}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.17974510059897553, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002465987111038623}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.026250493846268503, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0010076577262875675}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.06742089722818025, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002693226728725516}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.0373103830110333, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0014354470060085698}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.10061028549996975, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0013774691842900675}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.24845939880798545, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.003416347548558214}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.14142245724497754, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.001878295390484601}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.10150911522087737, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0014800824882477777}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.2508723286793532, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.003661797386209274}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.14274126658034353, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0020267265379362424}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 1.4877593210481137, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.0786306768078736}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b21bc4seed1/evaluation/generation/agg.4b284b21bc4seed1_gem_xsum_article_DOC_summary_2.json b/4b284b21bc4seed1/evaluation/generation/agg.4b284b21bc4seed1_gem_xsum_article_DOC_summary_2.json new file mode 100644 index 0000000000000000000000000000000000000000..cbaf287696018bd89a2cde2315972d04dcad02a8 --- /dev/null +++ b/4b284b21bc4seed1/evaluation/generation/agg.4b284b21bc4seed1_gem_xsum_article_DOC_summary_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.1272806924752953, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0018087494542713912}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.3130608961268874, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0041974862144461686}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.17878904396689269, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.00243376415334862}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.02583921544659326, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0009884044996505668}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.06617476951559573, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0026088727674303245}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.03670452685866085, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0014016808833113095}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.10041567883791579, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0013584120767201249}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.24945606421737898, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0033610500271998743}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.1413735388750044, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0018450620692794725}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.10073064727294082, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0014545958847864858}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.2508016791258512, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.003602192602128567}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.1419412969578001, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0019890982108612416}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 1.5028153336333563, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.07627640892766649}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b21bc4seed1/evaluation/generation/agg.4b284b21bc4seed1_gem_xsum_article_DOC_summary_3.json b/4b284b21bc4seed1/evaluation/generation/agg.4b284b21bc4seed1_gem_xsum_article_DOC_summary_3.json new file mode 100644 index 0000000000000000000000000000000000000000..88ac106bc7571e2807eea0c5e52d30576acfd42d --- /dev/null +++ b/4b284b21bc4seed1/evaluation/generation/agg.4b284b21bc4seed1_gem_xsum_article_DOC_summary_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.12623940374443, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0020446872317856236}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.2970674436926099, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004510700325635104}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.17306626516595003, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002606230170311302}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.025227030531171757, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.00099984133264785}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.062156816006725055, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0025180978338057826}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.035237949376792976, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0013859609116877547}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.09928754777119025, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0015425645112311069}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.23556252311929232, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.003514098352558134}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.1364033778870308, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0019668305545097802}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.09980705574148897, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0016450051443727947}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.23669283330652355, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0037461804498405958}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.13711597851384225, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002115039571938244}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 1.4368429875503554, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.06985209662692778}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b21bc4seed1/evaluation/generation/agg.4b284b21bc4seed1_gem_xsum_article_DOC_summary_4.json b/4b284b21bc4seed1/evaluation/generation/agg.4b284b21bc4seed1_gem_xsum_article_DOC_summary_4.json new file mode 100644 index 0000000000000000000000000000000000000000..65f2022580d15f5d38e53e311a337800e13b78a3 --- /dev/null +++ b/4b284b21bc4seed1/evaluation/generation/agg.4b284b21bc4seed1_gem_xsum_article_DOC_summary_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.04214614218832052, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0026107746281583345}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.07655987772910962, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004452578402829074}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.048983292472562175, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0027644367309486977}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.007766000425718809, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0007712139973537835}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.016794467199208594, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0015960487560251384}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.01004804307836075, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0009374479444550356}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.03417705858833514, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.002144817166226441}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.0611728887335129, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.003535855187265437}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.03916437496912562, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0021783828707728175}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.034323144988876814, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0021857348636160957}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.06145859851518466, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.003628835438679055}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.03924383294112677, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002217328487694054}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 0.6717545873809246, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.11330796657627773}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b21bc4seed1/evaluation/generation/agg.4b284b21bc4seed1_gem_xsum_article_DOC_summary_5.json b/4b284b21bc4seed1/evaluation/generation/agg.4b284b21bc4seed1_gem_xsum_article_DOC_summary_5.json new file mode 100644 index 0000000000000000000000000000000000000000..942a36097474bb51c0093ca9e32c59d99e62054f --- /dev/null +++ b/4b284b21bc4seed1/evaluation/generation/agg.4b284b21bc4seed1_gem_xsum_article_DOC_summary_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.0037186815835539475, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0010258999278355571}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.002971904217615499, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0007902202653735375}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.0032528851804285172, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0008749082661343398}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.0008463719964829843, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.00034301989930096845}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.000656010656010656, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0002674722049726138}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.0007279332281340716, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0002925088475825617}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.002842770899097203, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0007736763310592724}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.0023409347627226925, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.000630308860618993}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.0025265679608804242, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0006801945500560441}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.002946821953481221, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0008038704154971681}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.00243903003284904, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0006639365437911874}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.002627465953010381, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0007127898651991914}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 2.1058893408297867e-36, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 2.1724367476442414e-31}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b21bc4seed1/evaluation/generation/examples.4b284b21bc4seed1_GEM-web_nlg_en_PALM_prompt_0.jsonl b/4b284b21bc4seed1/evaluation/generation/examples.4b284b21bc4seed1_GEM-web_nlg_en_PALM_prompt_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..c8d62dc6586c2be65e06af8088af6979f8fbaf94 --- /dev/null +++ b/4b284b21bc4seed1/evaluation/generation/examples.4b284b21bc4seed1_GEM-web_nlg_en_PALM_prompt_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:38bbf5cc6cf30578575fcbb56fa3b2d745b4c9054fd49ef7428ed9dfe7a0fba5 +size 4158681 diff --git a/4b284b21bc4seed1/evaluation/generation/examples.4b284b21bc4seed1_GEM-web_nlg_en_PALM_prompt_1.jsonl b/4b284b21bc4seed1/evaluation/generation/examples.4b284b21bc4seed1_GEM-web_nlg_en_PALM_prompt_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..4d1ea3f1a9239a945f25853076c8a4ce953d09e7 --- /dev/null +++ b/4b284b21bc4seed1/evaluation/generation/examples.4b284b21bc4seed1_GEM-web_nlg_en_PALM_prompt_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c73b140c484073a4ea8053b1c16cab3d500b6b2c6b51a23c23ab09700eb327ad +size 5140334 diff --git a/4b284b21bc4seed1/evaluation/generation/examples.4b284b21bc4seed1_GEM-web_nlg_en_PALM_prompt_2.jsonl b/4b284b21bc4seed1/evaluation/generation/examples.4b284b21bc4seed1_GEM-web_nlg_en_PALM_prompt_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..4c753da44c458fe22d3fa93f5c1d4cade5304c2b --- /dev/null +++ b/4b284b21bc4seed1/evaluation/generation/examples.4b284b21bc4seed1_GEM-web_nlg_en_PALM_prompt_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c17b03305fbb4bb0b164be5fd8e4e07eb29f926a6881467b75e6572da0b43b7 +size 6052674 diff --git a/4b284b21bc4seed1/evaluation/generation/examples.4b284b21bc4seed1_GEM-web_nlg_en_PALM_prompt_3.jsonl b/4b284b21bc4seed1/evaluation/generation/examples.4b284b21bc4seed1_GEM-web_nlg_en_PALM_prompt_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..357d9b1422ba394357c0e1df8b134e3715794e37 --- /dev/null +++ b/4b284b21bc4seed1/evaluation/generation/examples.4b284b21bc4seed1_GEM-web_nlg_en_PALM_prompt_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6b6daf6cb36784a59c022f0c187b6f3972aceaae197595124bb94230feabebe +size 6959636 diff --git a/4b284b21bc4seed1/evaluation/generation/examples.4b284b21bc4seed1_GEM-web_nlg_en_PALM_prompt_4.jsonl b/4b284b21bc4seed1/evaluation/generation/examples.4b284b21bc4seed1_GEM-web_nlg_en_PALM_prompt_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..7d8bebdfc02dcbdb51e550f93706d1cf40e925ee --- /dev/null +++ b/4b284b21bc4seed1/evaluation/generation/examples.4b284b21bc4seed1_GEM-web_nlg_en_PALM_prompt_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5485b99066dca4e28647a5df5d18103abc1287b04c7c614f7a7a9492f02b5d59 +size 7859815 diff --git a/4b284b21bc4seed1/evaluation/generation/examples.4b284b21bc4seed1_GEM-web_nlg_en_PALM_prompt_5.jsonl b/4b284b21bc4seed1/evaluation/generation/examples.4b284b21bc4seed1_GEM-web_nlg_en_PALM_prompt_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..d819debe98a17cca19ce0af55068863fd7428467 --- /dev/null +++ b/4b284b21bc4seed1/evaluation/generation/examples.4b284b21bc4seed1_GEM-web_nlg_en_PALM_prompt_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9bbe79283fe7d23d3612d209e2fb4a77742572ca965642e5e21b0d437d27cfdb +size 8785235 diff --git a/4b284b21bc4seed1/evaluation/generation/examples.4b284b21bc4seed1_GEM-wiki_lingua_en_tldr_en_0.jsonl b/4b284b21bc4seed1/evaluation/generation/examples.4b284b21bc4seed1_GEM-wiki_lingua_en_tldr_en_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..0c9837efab6e75e973c426052f5dc5f47f5c8ad6 --- /dev/null +++ b/4b284b21bc4seed1/evaluation/generation/examples.4b284b21bc4seed1_GEM-wiki_lingua_en_tldr_en_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08e22e12717fa36094108902a70dfc34fc84ea736e93e4e1335b5b2d2a26086a +size 7688658 diff --git a/4b284b21bc4seed1/evaluation/generation/examples.4b284b21bc4seed1_GEM-wiki_lingua_en_tldr_en_1.jsonl b/4b284b21bc4seed1/evaluation/generation/examples.4b284b21bc4seed1_GEM-wiki_lingua_en_tldr_en_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..319e936d9e3e3c04fd2380e4cf8c148d8f292510 --- /dev/null +++ b/4b284b21bc4seed1/evaluation/generation/examples.4b284b21bc4seed1_GEM-wiki_lingua_en_tldr_en_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:673a6cd1a1202d2b5549e14eac761c34b3454c96dff80d3589020f440f6c1d5d +size 13311942 diff --git a/4b284b21bc4seed1/evaluation/generation/examples.4b284b21bc4seed1_GEM-wiki_lingua_en_tldr_en_2.jsonl b/4b284b21bc4seed1/evaluation/generation/examples.4b284b21bc4seed1_GEM-wiki_lingua_en_tldr_en_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..8752968124a839333b94976d32a2aeedec68067d --- /dev/null +++ b/4b284b21bc4seed1/evaluation/generation/examples.4b284b21bc4seed1_GEM-wiki_lingua_en_tldr_en_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:021d728751a69af4e9bf63e905391fcb948925df336f1d24c1d26c5f8961039e +size 18898719 diff --git a/4b284b21bc4seed1/evaluation/generation/examples.4b284b21bc4seed1_GEM-wiki_lingua_en_tldr_en_3.jsonl b/4b284b21bc4seed1/evaluation/generation/examples.4b284b21bc4seed1_GEM-wiki_lingua_en_tldr_en_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..8d6206f7142621a56b0243737fbc00c28cb1be94 --- /dev/null +++ b/4b284b21bc4seed1/evaluation/generation/examples.4b284b21bc4seed1_GEM-wiki_lingua_en_tldr_en_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:29a6e186cd94937f73f4d20aadb450ea992e94feeea800d13073042e67a69e4c +size 24316163 diff --git a/4b284b21bc4seed1/evaluation/generation/examples.4b284b21bc4seed1_GEM-wiki_lingua_en_tldr_en_4.jsonl b/4b284b21bc4seed1/evaluation/generation/examples.4b284b21bc4seed1_GEM-wiki_lingua_en_tldr_en_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..97d79b2123bb0dcc2986d111bd286e604e0974d8 --- /dev/null +++ b/4b284b21bc4seed1/evaluation/generation/examples.4b284b21bc4seed1_GEM-wiki_lingua_en_tldr_en_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:195080d05b3233d4a59a7ae075143e69d25afbb31414bb338266e40fe29b189a +size 29466016 diff --git a/4b284b21bc4seed1/evaluation/generation/examples.4b284b21bc4seed1_GEM-wiki_lingua_en_tldr_en_5.jsonl b/4b284b21bc4seed1/evaluation/generation/examples.4b284b21bc4seed1_GEM-wiki_lingua_en_tldr_en_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..35b55e160dcab52c6928109b1465c9d6a0a23e66 --- /dev/null +++ b/4b284b21bc4seed1/evaluation/generation/examples.4b284b21bc4seed1_GEM-wiki_lingua_en_tldr_en_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:44494ad97a9f9696e1bdffb36df72644d9e213f2b101e670371e05026c238778 +size 34798571 diff --git a/4b284b21bc4seed1/evaluation/generation/examples.4b284b21bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl b/4b284b21bc4seed1/evaluation/generation/examples.4b284b21bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..6a4071c7cbf5dbbeb058b52367dead234553fc02 --- /dev/null +++ b/4b284b21bc4seed1/evaluation/generation/examples.4b284b21bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e4cf04217bb9b80915a89d69711aae95b7ad28bbec54dc8138ebd4eaa9c2e0c2 +size 4516428 diff --git a/4b284b21bc4seed1/evaluation/generation/examples.4b284b21bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl b/4b284b21bc4seed1/evaluation/generation/examples.4b284b21bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..69a1b84c1830d35509a81a890d3c9c59ae455fe9 --- /dev/null +++ b/4b284b21bc4seed1/evaluation/generation/examples.4b284b21bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4348ecb5633d92196154b26deb943e93c00bcb0bbd7234d1d8a4f727fa97a441 +size 5157323 diff --git a/4b284b21bc4seed1/evaluation/generation/examples.4b284b21bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl b/4b284b21bc4seed1/evaluation/generation/examples.4b284b21bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..b7d65d95c53cc29bf6d588d2cd397fb81c3f51c9 --- /dev/null +++ b/4b284b21bc4seed1/evaluation/generation/examples.4b284b21bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f11fe76cca799015059c9110901c93203be0de3486f08a37ad14733926aca9f0 +size 6143212 diff --git a/4b284b21bc4seed1/evaluation/generation/examples.4b284b21bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl b/4b284b21bc4seed1/evaluation/generation/examples.4b284b21bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..f5e8c0257401bf7bb15d97e641e00ca0e343834e --- /dev/null +++ b/4b284b21bc4seed1/evaluation/generation/examples.4b284b21bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e75c49c55ef1f3646fea2f50425644e9e70f0071315f26fe27e79440ee00d465 +size 7204549 diff --git a/4b284b21bc4seed1/evaluation/generation/examples.4b284b21bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl b/4b284b21bc4seed1/evaluation/generation/examples.4b284b21bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..c4a0d92c5bf28f00eec2b261f4df014ba1ee5d6e --- /dev/null +++ b/4b284b21bc4seed1/evaluation/generation/examples.4b284b21bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d477f53548d63f2cc59f465bee3afb79168a44e9819b2516ca2f640e5f9b72e +size 8267826 diff --git a/4b284b21bc4seed1/evaluation/generation/examples.4b284b21bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl b/4b284b21bc4seed1/evaluation/generation/examples.4b284b21bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..b5cb2f89fca82a10e431f57535e34ec53740a21b --- /dev/null +++ b/4b284b21bc4seed1/evaluation/generation/examples.4b284b21bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:444546afa16111dd5fe66a4f6c66cca28475a37a0208063ed66ba1674bb36a92 +size 9350935 diff --git a/4b284b21bc4seed1/evaluation/generation/examples.4b284b21bc4seed1_gem_xsum_article_DOC_summary_0.jsonl b/4b284b21bc4seed1/evaluation/generation/examples.4b284b21bc4seed1_gem_xsum_article_DOC_summary_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..30c45899d1ed82ce5aa5da9db376ae054bede328 --- /dev/null +++ b/4b284b21bc4seed1/evaluation/generation/examples.4b284b21bc4seed1_gem_xsum_article_DOC_summary_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e35c5b4c358f7cbe07fa8ae28090a020b7f198a60dbe8ef8411f6f0d6aaad87 +size 2806300 diff --git a/4b284b21bc4seed1/evaluation/generation/examples.4b284b21bc4seed1_gem_xsum_article_DOC_summary_1.jsonl b/4b284b21bc4seed1/evaluation/generation/examples.4b284b21bc4seed1_gem_xsum_article_DOC_summary_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..45bd5bd9f9db4eb800620f0fa90d820b1ddcf3b3 --- /dev/null +++ b/4b284b21bc4seed1/evaluation/generation/examples.4b284b21bc4seed1_gem_xsum_article_DOC_summary_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f2f782b99acd2da91e4ef7ea6005a79ca483e2ec2c4f632dfe48aab399a0834 +size 5101872 diff --git a/4b284b21bc4seed1/evaluation/generation/examples.4b284b21bc4seed1_gem_xsum_article_DOC_summary_2.jsonl b/4b284b21bc4seed1/evaluation/generation/examples.4b284b21bc4seed1_gem_xsum_article_DOC_summary_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..92183b7a0e84563f765188e42b99814edde71334 --- /dev/null +++ b/4b284b21bc4seed1/evaluation/generation/examples.4b284b21bc4seed1_gem_xsum_article_DOC_summary_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:43869cb45bbc83e269592da01511d84b1a6ac6d161da8547015ae237a5fa2759 +size 7376317 diff --git a/4b284b21bc4seed1/evaluation/generation/examples.4b284b21bc4seed1_gem_xsum_article_DOC_summary_3.jsonl b/4b284b21bc4seed1/evaluation/generation/examples.4b284b21bc4seed1_gem_xsum_article_DOC_summary_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e568e421c9482ba1ca18b3a4e55d05f3fc50896c --- /dev/null +++ b/4b284b21bc4seed1/evaluation/generation/examples.4b284b21bc4seed1_gem_xsum_article_DOC_summary_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d7d731cea34107f599e83401e72ec4a600b86cf4a9922cd99a7e90a01e8d920 +size 9644184 diff --git a/4b284b21bc4seed1/evaluation/generation/examples.4b284b21bc4seed1_gem_xsum_article_DOC_summary_4.jsonl b/4b284b21bc4seed1/evaluation/generation/examples.4b284b21bc4seed1_gem_xsum_article_DOC_summary_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..de2f0cd16d26527feed27595e10a22a6fd4fa9c0 --- /dev/null +++ b/4b284b21bc4seed1/evaluation/generation/examples.4b284b21bc4seed1_gem_xsum_article_DOC_summary_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:543c58726f2b77e9df4e0ee7f9a76d8b7527baa15ca11007ce33be317e35c750 +size 11671637 diff --git a/4b284b21bc4seed1/evaluation/generation/examples.4b284b21bc4seed1_gem_xsum_article_DOC_summary_5.jsonl b/4b284b21bc4seed1/evaluation/generation/examples.4b284b21bc4seed1_gem_xsum_article_DOC_summary_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..f04a8f13b6a7cfb9ff8c02c0974dfbbad0a4f123 --- /dev/null +++ b/4b284b21bc4seed1/evaluation/generation/examples.4b284b21bc4seed1_gem_xsum_article_DOC_summary_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f35b1da52766141e5418ff78e13da7a16b2724f874b9f3467cbc2c5b5650e4f +size 13897539 diff --git a/4b284b21bc4seed1/evaluation/generation/slim.4b284b21bc4seed1_GEM-web_nlg_en_PALM_prompt_0.json b/4b284b21bc4seed1/evaluation/generation/slim.4b284b21bc4seed1_GEM-web_nlg_en_PALM_prompt_0.json new file mode 100644 index 0000000000000000000000000000000000000000..ff8629035b7c71a080bcfe1efddcd4e4a12451bf --- /dev/null +++ b/4b284b21bc4seed1/evaluation/generation/slim.4b284b21bc4seed1_GEM-web_nlg_en_PALM_prompt_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.33272479915628694, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.031796098410938015 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.06768598529946503, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.001826760753754374 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.273245918626827, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.004811539102181524 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.09992028750901691, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.002068624719484398 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.0319815601358353, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.001123592878248015 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.132780352400067, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0031651283586402535 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.047572357019245066, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0012754558397189623 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.06526863289287767, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.00173604911565671 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.2659429125520888, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004693559342531821 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.09656759025734364, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0019482031642887698 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.06475652685202478, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.001750562854208181 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.261555669425398, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004531537846674438 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.09550510540717662, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0019437957791240722 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b21bc4seed1/evaluation/generation/slim.4b284b21bc4seed1_GEM-web_nlg_en_PALM_prompt_1.json b/4b284b21bc4seed1/evaluation/generation/slim.4b284b21bc4seed1_GEM-web_nlg_en_PALM_prompt_1.json new file mode 100644 index 0000000000000000000000000000000000000000..d7bb45025c677c5e7a358391f4c2bf3210d5ff9b --- /dev/null +++ b/4b284b21bc4seed1/evaluation/generation/slim.4b284b21bc4seed1_GEM-web_nlg_en_PALM_prompt_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.5102447245370249, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.035376593830697835 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.07172631396783712, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0015940647947642393 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.3498874090683673, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.005494538712125141 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.11038438449277037, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0019607246874588217 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.03374360598633707, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0011472248278029387 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.17065910212771632, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0037615577096519314 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.0513340131604287, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0012161196627700137 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.06735170136224546, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0014692804169579693 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.32775015583004236, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.005027007036378035 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.10363295036370204, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0017764857744676573 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.06821168744641012, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0015257497030318006 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.3303827812174427, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.005034171208777432 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.10476642693447911, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.001844638754248624 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b21bc4seed1/evaluation/generation/slim.4b284b21bc4seed1_GEM-web_nlg_en_PALM_prompt_2.json b/4b284b21bc4seed1/evaluation/generation/slim.4b284b21bc4seed1_GEM-web_nlg_en_PALM_prompt_2.json new file mode 100644 index 0000000000000000000000000000000000000000..7ecbd691e76ea89a0de4e52016efa4a1e731999c --- /dev/null +++ b/4b284b21bc4seed1/evaluation/generation/slim.4b284b21bc4seed1_GEM-web_nlg_en_PALM_prompt_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.6028097084858823, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.03400607345942724 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.07447162662420612, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.001363119521612849 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.39133197093760397, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.005455286809780116 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.11747286047545925, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0018369017696682527 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.03418924065620199, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0008008890429324677 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.19324361036894205, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0038848529810624356 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.054159534529018366, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.00112831864459488 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.06854684035035577, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0012086804724451806 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.35968605242390533, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004868740565794037 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.10807779989120546, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.001612487862874725 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.0706586243525616, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0012889308612371538 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.36945068896305344, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0050409156545949945 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.11132296857949775, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0017256589790344656 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b21bc4seed1/evaluation/generation/slim.4b284b21bc4seed1_GEM-web_nlg_en_PALM_prompt_3.json b/4b284b21bc4seed1/evaluation/generation/slim.4b284b21bc4seed1_GEM-web_nlg_en_PALM_prompt_3.json new file mode 100644 index 0000000000000000000000000000000000000000..4240fd86fd511527601cbe68f9397817087920c3 --- /dev/null +++ b/4b284b21bc4seed1/evaluation/generation/slim.4b284b21bc4seed1_GEM-web_nlg_en_PALM_prompt_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.701781042691669, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.028304269361164428 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.07483297992459019, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0013297778153553014 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.40075245309368346, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.005510805436391809 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.1186720883935396, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0018557604964665015 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.03405829473639484, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0007867378650100502 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.1965036741041513, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0039013830928258273 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.05434522629151618, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0011369092672670533 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.06814102346988, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.001142595819228343 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.36375561641075393, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004784629751764729 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.10798420755086514, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.001585937192657532 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.0705542561432147, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0012322784221801353 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.376368921472397, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.005042206855487164 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.11180266475563037, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0017161756564434687 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b21bc4seed1/evaluation/generation/slim.4b284b21bc4seed1_GEM-web_nlg_en_PALM_prompt_4.json b/4b284b21bc4seed1/evaluation/generation/slim.4b284b21bc4seed1_GEM-web_nlg_en_PALM_prompt_4.json new file mode 100644 index 0000000000000000000000000000000000000000..f8e6a584b78a2b3fd92cd598caacc612f5667fd2 --- /dev/null +++ b/4b284b21bc4seed1/evaluation/generation/slim.4b284b21bc4seed1_GEM-web_nlg_en_PALM_prompt_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.7208477776174064, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.03611939053214278 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.07573522475977945, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0012828287982675156 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.4140707617730325, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.005500874400250013 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.12065545317279747, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0017878857789550631 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.03464259052791206, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0007595549203652654 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.20555557401100102, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.003919174647287531 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.05546852434740693, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.001093391566003447 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.06882833861974198, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.00110954922342777 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.37506782401870103, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004831464763832598 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.10954384971885704, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.001541389309718117 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.07144735748031365, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0011999248890901264 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.3887273820866732, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.005052183598911252 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.11373501038504552, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0016710119042870925 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b21bc4seed1/evaluation/generation/slim.4b284b21bc4seed1_GEM-web_nlg_en_PALM_prompt_5.json b/4b284b21bc4seed1/evaluation/generation/slim.4b284b21bc4seed1_GEM-web_nlg_en_PALM_prompt_5.json new file mode 100644 index 0000000000000000000000000000000000000000..a09f682d6a6fcc08c0546b209fa05f3991a222b4 --- /dev/null +++ b/4b284b21bc4seed1/evaluation/generation/slim.4b284b21bc4seed1_GEM-web_nlg_en_PALM_prompt_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.8098840843933562, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.042922709276963275 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.07551077098651218, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0011967463119907174 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.42778952645041607, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.005509208476502683 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.12112590895694009, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0016877211094516577 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.03488380229207791, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0007164646591878178 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.21683909270039745, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0040700970178128 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.05638496281385114, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0010526694616578302 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.06816852013471421, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0010570419074259674 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.3851255216729155, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004804722289936786 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.1091505948569381, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0014719382275165554 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.07111730496416463, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0011271521292987115 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.40225015185589585, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.005071744746719108 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.1139947508286874, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0015813085492093937 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b21bc4seed1/evaluation/generation/slim.4b284b21bc4seed1_GEM-wiki_lingua_en_tldr_en_0.json b/4b284b21bc4seed1/evaluation/generation/slim.4b284b21bc4seed1_GEM-wiki_lingua_en_tldr_en_0.json new file mode 100644 index 0000000000000000000000000000000000000000..3f51e9a4c89e9bab3db83cb85f5c4ed1ed4f76ea --- /dev/null +++ b/4b284b21bc4seed1/evaluation/generation/slim.4b284b21bc4seed1_GEM-wiki_lingua_en_tldr_en_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.15167532178589505, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0019073207185280718 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.2612333406333799, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0026793907173360246 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.17820031429089941, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.001867331386262004 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.03148570054286659, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0007720646786309003 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.05626578766960683, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0014278552081629383 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.03716728942279169, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0008623486309823396 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.116140614745089, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0013156638447678107 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.2083623246576857, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0021996516173952707 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.13833033412198834, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0013282918104537548 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.13994812048897234, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0017518520260318953 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.2422441673257693, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0024926109810662115 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.16463728733959723, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0017151648189316772 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 1.604770833205388, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.045152527476120426 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b21bc4seed1/evaluation/generation/slim.4b284b21bc4seed1_GEM-wiki_lingua_en_tldr_en_1.json b/4b284b21bc4seed1/evaluation/generation/slim.4b284b21bc4seed1_GEM-wiki_lingua_en_tldr_en_1.json new file mode 100644 index 0000000000000000000000000000000000000000..43ad57f0c92aa4777bc653f7d9d1579fcae9e5f7 --- /dev/null +++ b/4b284b21bc4seed1/evaluation/generation/slim.4b284b21bc4seed1_GEM-wiki_lingua_en_tldr_en_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.17995455895644027, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0021143646937022468 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.29822507703809786, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0029202005379262794 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.20675601444211894, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0019509220985923807 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.04280457785161096, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0010705605908791504 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.07256480707864589, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0016883207002489 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.0485299590695294, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.000987435381157907 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.128484042233791, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0014903515496972157 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.21893094707653085, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0022685657736807928 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.14838617751760952, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0013193585886492735 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.1682253075781992, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.001983258112076011 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.27945450640399006, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.002751044005784169 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.19330419331545362, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.001817315871702104 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 2.3579628914986084, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.06443336501226987 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b21bc4seed1/evaluation/generation/slim.4b284b21bc4seed1_GEM-wiki_lingua_en_tldr_en_2.json b/4b284b21bc4seed1/evaluation/generation/slim.4b284b21bc4seed1_GEM-wiki_lingua_en_tldr_en_2.json new file mode 100644 index 0000000000000000000000000000000000000000..6d3d66556efa186818d2908640cde072c74683d9 --- /dev/null +++ b/4b284b21bc4seed1/evaluation/generation/slim.4b284b21bc4seed1_GEM-wiki_lingua_en_tldr_en_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.1942548807242778, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0023454682458510967 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.3038516433424921, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0028161999694894368 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.21447969004311607, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0018895718255246762 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.0492948803130678, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0011990391917610706 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.0782436349256461, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0017608820777292064 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.05328365330541802, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0010288709039921085 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.1390228041509367, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0017234767147472074 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.22270032621786837, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.002252792096654515 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.15374474737766516, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0013038739578348723 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.18265776299811193, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0022101445170749252 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.28667373859931605, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.002687218604461664 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.2018034121125251, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0017698133555769187 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 2.770701026929389, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.055755441860674826 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b21bc4seed1/evaluation/generation/slim.4b284b21bc4seed1_GEM-wiki_lingua_en_tldr_en_3.json b/4b284b21bc4seed1/evaluation/generation/slim.4b284b21bc4seed1_GEM-wiki_lingua_en_tldr_en_3.json new file mode 100644 index 0000000000000000000000000000000000000000..950c8512ebbea8391002328be2f5fc69179a1f1a --- /dev/null +++ b/4b284b21bc4seed1/evaluation/generation/slim.4b284b21bc4seed1_GEM-wiki_lingua_en_tldr_en_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.16605472663049203, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0026215736776626004 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.24674896622444079, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0032942062409122403 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.17584661717144687, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0022080154978502656 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.041252526415028114, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0012562811469129071 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.06385056201459363, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0017227611606126488 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.04324074407846396, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.001030508940585308 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.12107072019854664, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0020206323069935596 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.18199308221887076, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0025743010221870987 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.12719556123913905, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0015628923302645156 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.15696755228304862, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0025037796725520395 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.23345046038796602, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.003144339747645053 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.166023927031211, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0020868492894240698 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 2.6943492797886797, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.048945628141051856 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b21bc4seed1/evaluation/generation/slim.4b284b21bc4seed1_GEM-wiki_lingua_en_tldr_en_4.json b/4b284b21bc4seed1/evaluation/generation/slim.4b284b21bc4seed1_GEM-wiki_lingua_en_tldr_en_4.json new file mode 100644 index 0000000000000000000000000000000000000000..ce71a54985f587b5c0e9a3490caaee9c23517b19 --- /dev/null +++ b/4b284b21bc4seed1/evaluation/generation/slim.4b284b21bc4seed1_GEM-wiki_lingua_en_tldr_en_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.05342346190272065, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.002056550316894281 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.07978774494235341, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0028101467900972705 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.05454947380142532, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.001847757669359123 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.012258350990130428, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0007138900312061555 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.02028789716505487, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0011428305900431244 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.01286346881894465, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0006471740657104415 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.040366367324606266, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0016113191055682687 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.06061271598925825, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0021836846333784096 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.0407204750127799, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0013676744674585327 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.050133371793595845, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0019436034391785793 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.07473111376648439, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0026329914241005055 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.05108474776360767, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0017328648234254131 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 0.5943697556411244, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.030734589500314064 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b21bc4seed1/evaluation/generation/slim.4b284b21bc4seed1_GEM-wiki_lingua_en_tldr_en_5.json b/4b284b21bc4seed1/evaluation/generation/slim.4b284b21bc4seed1_GEM-wiki_lingua_en_tldr_en_5.json new file mode 100644 index 0000000000000000000000000000000000000000..f61c79303e296fbd1ad960919195507e8c56f760 --- /dev/null +++ b/4b284b21bc4seed1/evaluation/generation/slim.4b284b21bc4seed1_GEM-wiki_lingua_en_tldr_en_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.008364381665919872, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0008819285241796705 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.012634998947429131, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0012520411703047264 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.008385094317414335, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0007962608828602142 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.0019514480000772428, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0002950485643713033 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.0034586914827538628, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.000553626619531344 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.0020213111085609944, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0002694978086459766 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.006554032979312583, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0006990429427874044 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.010080116076976064, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0010433208473045565 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.006545584095103677, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0006266707040781551 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.007976144780102256, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0008419903349386873 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.012040227491122851, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.001201302499319246 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.007958529393460171, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0007541972102063722 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 1.5595918572619473e-06, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 2.8487471872210672e-06 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b21bc4seed1/evaluation/generation/slim.4b284b21bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_0.json b/4b284b21bc4seed1/evaluation/generation/slim.4b284b21bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_0.json new file mode 100644 index 0000000000000000000000000000000000000000..9f9726323ae27e535f946b12944098f9628d520e --- /dev/null +++ b/4b284b21bc4seed1/evaluation/generation/slim.4b284b21bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 0.01599277764818925, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.004308927933825235 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.012870158730159176, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.00026604075009303314 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.02306192594226545, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0005060585834775515 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.016178489257483206, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0003336557540954231 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.00011382113821138212, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 3.0353975217624302e-05 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.00016007109878338666, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 4.471587603586543e-05 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.00012949433318118156, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 3.494334474550083e-05 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.012870158730159176, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.00026604075009303314 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.02306192594226545, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0005060585834775515 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.016178489257483206, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0003336557540954231 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.012401587301587743, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0002495014907480676 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.022186928253083223, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.00046927560289039864 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.015580467425438196, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0003114685494407546 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b21bc4seed1/evaluation/generation/slim.4b284b21bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_1.json b/4b284b21bc4seed1/evaluation/generation/slim.4b284b21bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_1.json new file mode 100644 index 0000000000000000000000000000000000000000..789896c092f7b4897a051fcd5a2eb42acc7bd775 --- /dev/null +++ b/4b284b21bc4seed1/evaluation/generation/slim.4b284b21bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 9.29730492833567, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.07258438562915104 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.4508609495206719, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0036311478842959532 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.4256279851535847, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.002998743529748849 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.40179356473852385, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0024053635164423257 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.20803358909759323, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.002540052178876273 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.19234516196309973, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0021041392938787457 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.1821558520162302, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0018839477104031566 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.33647256551604726, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0029522675564527113 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.32133682780546957, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0025106371554624155 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.3001108360092531, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0019304143016397508 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.36851923372760476, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0033065014951933927 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.3458837990441542, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0027230707350231853 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.3272696975463691, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.002280428848910135 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b21bc4seed1/evaluation/generation/slim.4b284b21bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_2.json b/4b284b21bc4seed1/evaluation/generation/slim.4b284b21bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_2.json new file mode 100644 index 0000000000000000000000000000000000000000..b9a65cc2e145fe977d742d1aac507971cda6a19f --- /dev/null +++ b/4b284b21bc4seed1/evaluation/generation/slim.4b284b21bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 12.759775802861823, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.1293139727386451 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.5296073064762413, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0033783994941725144 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.4363790698973518, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0029267544023528365 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.4496590978589395, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.002303602978907222 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.25851059818334, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0026408591114483963 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.20978543572844377, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.002146572930760848 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.2160790254378622, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.001955317829071995 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.39232032536879197, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0029964581011695346 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.3219131393183246, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0024670087975040625 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.33140579758047195, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0020369186351820263 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.4374911840880169, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0032563934045941744 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.35889049112539584, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0027163755824492135 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.3703216404379091, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0022909574817028392 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b21bc4seed1/evaluation/generation/slim.4b284b21bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_3.json b/4b284b21bc4seed1/evaluation/generation/slim.4b284b21bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_3.json new file mode 100644 index 0000000000000000000000000000000000000000..848aac56dd063649ff0971b268635fcdc2bd7e56 --- /dev/null +++ b/4b284b21bc4seed1/evaluation/generation/slim.4b284b21bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 13.39712229435215, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.2190368432916537 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.5434706515030117, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0032446983744738762 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.43747355273891847, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0028993863830845397 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.4585328203108971, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0022516911107973987 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.27356714226869305, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0026390580957758175 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.21639197788244496, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0021805025438367607 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.2270812503617402, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0019758386181450292 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.40618251147113754, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0029740816706799833 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.3236014788599963, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0024273522496127556 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.34028277436237736, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0020545641994681512 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.4532770963097311, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0031647100865919084 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.36298447462453876, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0026887391183781422 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.38125456908954924, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.002257169022713513 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b21bc4seed1/evaluation/generation/slim.4b284b21bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_4.json b/4b284b21bc4seed1/evaluation/generation/slim.4b284b21bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_4.json new file mode 100644 index 0000000000000000000000000000000000000000..15e53642a3b140e0b7a714a0cf62e17c0c819f95 --- /dev/null +++ b/4b284b21bc4seed1/evaluation/generation/slim.4b284b21bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 13.278538903088437, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.19304270040523466 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.5550942770770999, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.00321920680863295 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.43254174724244665, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0027648654319805638 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.4614844218085089, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0021663747761732207 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.28123246363040955, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0027007119359494314 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.2150097554160261, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.002138899675268787 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.22970482247017235, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.00197438239706358 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.4143281149202266, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.002969403717017417 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.32090483861163693, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0023977607834718777 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.3427415979760685, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0020357821149855123 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.46330716929389093, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0031399338067163917 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.3607474288264691, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.002652994557246981 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.3847530991565415, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0022220842320301534 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b21bc4seed1/evaluation/generation/slim.4b284b21bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_5.json b/4b284b21bc4seed1/evaluation/generation/slim.4b284b21bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_5.json new file mode 100644 index 0000000000000000000000000000000000000000..9fb0055f097f2d898a4bdbbe513fb04cbc12a69f --- /dev/null +++ b/4b284b21bc4seed1/evaluation/generation/slim.4b284b21bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 13.349674798491353, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.2620211666324464 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.5580977741060988, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.003152695337297477 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.4318929339624608, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0027232610944967796 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.46359996980874846, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0021412883557770652 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.282134536476671, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0026354539351566403 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.21417820926964778, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0020891541191163186 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.2303452786552104, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0019438168093482682 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.416156553657584, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.002921110787140179 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.3201090740050369, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0023555592018131553 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.34414481054807766, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0020332629423129916 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.46739254821741905, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0031264669970885233 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.3608544692904568, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0026213087830254975 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.38760985028639305, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.002239740316941447 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b21bc4seed1/evaluation/generation/slim.4b284b21bc4seed1_gem_xsum_article_DOC_summary_0.json b/4b284b21bc4seed1/evaluation/generation/slim.4b284b21bc4seed1_gem_xsum_article_DOC_summary_0.json new file mode 100644 index 0000000000000000000000000000000000000000..662f1ba0aea9847412f1ee4b6e54c23e50342c85 --- /dev/null +++ b/4b284b21bc4seed1/evaluation/generation/slim.4b284b21bc4seed1_gem_xsum_article_DOC_summary_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.15826471323077757, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.002220888825623518 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.33446079519909305, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.004514327805033082 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.20682985522235142, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.002563714031203911 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.03352875592509948, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0012249216700579001 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.07724702868679346, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.002831153557559276 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.04522961690526853, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0015798221742638174 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.1175738942721655, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0016420722284867819 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.2512371460248057, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.003517155084540941 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.1540627639559492, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0019062590295789597 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.12200871250100262, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0017899421156850875 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.26225586640138876, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0040169777118884645 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.16037094135484917, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0021767207134326364 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 1.8758881711718112, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.06414775170791744 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b21bc4seed1/evaluation/generation/slim.4b284b21bc4seed1_gem_xsum_article_DOC_summary_1.json b/4b284b21bc4seed1/evaluation/generation/slim.4b284b21bc4seed1_gem_xsum_article_DOC_summary_1.json new file mode 100644 index 0000000000000000000000000000000000000000..70cd731c4e2fd5ba35dcdde90815269a6da8ba8f --- /dev/null +++ b/4b284b21bc4seed1/evaluation/generation/slim.4b284b21bc4seed1_gem_xsum_article_DOC_summary_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.12818817016431805, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0018328880795144842 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.3134061916653512, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.004249929100773614 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.17974510059897553, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.002465987111038623 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.026250493846268503, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0010076577262875675 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.06742089722818025, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.002693226728725516 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.0373103830110333, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0014354470060085698 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.10061028549996975, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0013774691842900675 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.24845939880798545, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.003416347548558214 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.14142245724497754, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.001878295390484601 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.10150911522087737, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0014800824882477777 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.2508723286793532, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.003661797386209274 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.14274126658034353, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0020267265379362424 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 1.4877593210481137, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.0786306768078736 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b21bc4seed1/evaluation/generation/slim.4b284b21bc4seed1_gem_xsum_article_DOC_summary_2.json b/4b284b21bc4seed1/evaluation/generation/slim.4b284b21bc4seed1_gem_xsum_article_DOC_summary_2.json new file mode 100644 index 0000000000000000000000000000000000000000..cff160f055aef00c731598fa9ee23e81c560b444 --- /dev/null +++ b/4b284b21bc4seed1/evaluation/generation/slim.4b284b21bc4seed1_gem_xsum_article_DOC_summary_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.1272806924752953, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0018087494542713912 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.3130608961268874, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.0041974862144461686 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.17878904396689269, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.00243376415334862 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.02583921544659326, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0009884044996505668 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.06617476951559573, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0026088727674303245 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.03670452685866085, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0014016808833113095 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.10041567883791579, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0013584120767201249 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.24945606421737898, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0033610500271998743 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.1413735388750044, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0018450620692794725 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.10073064727294082, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0014545958847864858 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.2508016791258512, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.003602192602128567 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.1419412969578001, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0019890982108612416 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 1.5028153336333563, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.07627640892766649 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b21bc4seed1/evaluation/generation/slim.4b284b21bc4seed1_gem_xsum_article_DOC_summary_3.json b/4b284b21bc4seed1/evaluation/generation/slim.4b284b21bc4seed1_gem_xsum_article_DOC_summary_3.json new file mode 100644 index 0000000000000000000000000000000000000000..46591d23c7dc8cafe8bea09b965d9d0f7ec2af58 --- /dev/null +++ b/4b284b21bc4seed1/evaluation/generation/slim.4b284b21bc4seed1_gem_xsum_article_DOC_summary_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.12623940374443, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0020446872317856236 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.2970674436926099, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.004510700325635104 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.17306626516595003, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.002606230170311302 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.025227030531171757, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.00099984133264785 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.062156816006725055, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0025180978338057826 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.035237949376792976, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0013859609116877547 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.09928754777119025, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0015425645112311069 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.23556252311929232, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.003514098352558134 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.1364033778870308, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0019668305545097802 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.09980705574148897, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0016450051443727947 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.23669283330652355, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0037461804498405958 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.13711597851384225, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.002115039571938244 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 1.4368429875503554, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.06985209662692778 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b21bc4seed1/evaluation/generation/slim.4b284b21bc4seed1_gem_xsum_article_DOC_summary_4.json b/4b284b21bc4seed1/evaluation/generation/slim.4b284b21bc4seed1_gem_xsum_article_DOC_summary_4.json new file mode 100644 index 0000000000000000000000000000000000000000..c77c34b7ff638646caf4ea7c40ab3efeca24a0d5 --- /dev/null +++ b/4b284b21bc4seed1/evaluation/generation/slim.4b284b21bc4seed1_gem_xsum_article_DOC_summary_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.04214614218832052, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0026107746281583345 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.07655987772910962, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.004452578402829074 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.048983292472562175, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0027644367309486977 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.007766000425718809, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0007712139973537835 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.016794467199208594, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0015960487560251384 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.01004804307836075, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0009374479444550356 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.03417705858833514, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.002144817166226441 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.0611728887335129, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.003535855187265437 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.03916437496912562, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0021783828707728175 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.034323144988876814, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0021857348636160957 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.06145859851518466, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.003628835438679055 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.03924383294112677, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.002217328487694054 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 0.6717545873809246, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.11330796657627773 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b21bc4seed1/evaluation/generation/slim.4b284b21bc4seed1_gem_xsum_article_DOC_summary_5.json b/4b284b21bc4seed1/evaluation/generation/slim.4b284b21bc4seed1_gem_xsum_article_DOC_summary_5.json new file mode 100644 index 0000000000000000000000000000000000000000..82c504e8552cb1e64946ce3941447f4706d34204 --- /dev/null +++ b/4b284b21bc4seed1/evaluation/generation/slim.4b284b21bc4seed1_gem_xsum_article_DOC_summary_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.0037186815835539475, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0010258999278355571 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.002971904217615499, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.0007902202653735375 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.0032528851804285172, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0008749082661343398 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.0008463719964829843, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.00034301989930096845 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.000656010656010656, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0002674722049726138 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.0007279332281340716, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0002925088475825617 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.002842770899097203, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0007736763310592724 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.0023409347627226925, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.000630308860618993 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.0025265679608804242, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0006801945500560441 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.002946821953481221, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0008038704154971681 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.00243903003284904, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0006639365437911874 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.002627465953010381, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0007127898651991914 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 2.1058893408297867e-36, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 2.1724367476442414e-31 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b21bc4seed1/evaluation/rankeval/4b284b21bc4seed1_0.json b/4b284b21bc4seed1/evaluation/rankeval/4b284b21bc4seed1_0.json new file mode 100644 index 0000000000000000000000000000000000000000..a3bf8e3018b0efbc3058006e428aca902ed2a2ea --- /dev/null +++ b/4b284b21bc4seed1/evaluation/rankeval/4b284b21bc4seed1_0.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.332, + "acc_stderr": 0.014899597242811482 + }, + "anli_r2": { + "acc": 0.324, + "acc_stderr": 0.014806864733738857 + }, + "anli_r3": { + "acc": 0.3491666666666667, + "acc_stderr": 0.013767075395077247 + }, + "cb": { + "acc": 0.42857142857142855, + "acc_stderr": 0.06672848092813058, + "f1": 0.36493558776167473 + }, + "copa": { + "acc": 0.77, + "acc_stderr": 0.042295258468165065 + }, + "hellaswag": { + "acc": 0.4695279824736108, + "acc_stderr": 0.004980506329407586, + "acc_norm": 0.6156144194383589, + "acc_norm_stderr": 0.0048545552940175395 + }, + "rte": { + "acc": 0.5451263537906137, + "acc_stderr": 0.029973636495415252 + }, + "winogrande": { + "acc": 0.5832675611681136, + "acc_stderr": 0.013856250072796316 + }, + "storycloze_2016": { + "acc": 0.7199358631747729, + "acc_stderr": 0.01038376499392048 + }, + "boolq": { + "acc": 0.6220183486238532, + "acc_stderr": 0.008480656964585246 + }, + "arc_easy": { + "acc": 0.6018518518518519, + "acc_stderr": 0.010044662374653396, + "acc_norm": 0.5286195286195287, + "acc_norm_stderr": 0.010242962617927197 + }, + "arc_challenge": { + "acc": 0.27474402730375425, + "acc_stderr": 0.013044617212771227, + "acc_norm": 0.295221843003413, + "acc_norm_stderr": 0.013329750293382316 + }, + "sciq": { + "acc": 0.832, + "acc_stderr": 0.011828605831454267, + "acc_norm": 0.751, + "acc_norm_stderr": 0.013681600278702296 + }, + "piqa": { + "acc": 0.750272034820457, + "acc_stderr": 0.010099232969867483, + "acc_norm": 0.7600652883569097, + "acc_norm_stderr": 0.009963625892809545 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b21bc4seed1/evaluation/rankeval/4b284b21bc4seed1_0_lm-eval_global_step80108_2023-02-15-11-04-03_0shots_backup.json b/4b284b21bc4seed1/evaluation/rankeval/4b284b21bc4seed1_0_lm-eval_global_step80108_2023-02-15-11-04-03_0shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..a3bf8e3018b0efbc3058006e428aca902ed2a2ea --- /dev/null +++ b/4b284b21bc4seed1/evaluation/rankeval/4b284b21bc4seed1_0_lm-eval_global_step80108_2023-02-15-11-04-03_0shots_backup.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.332, + "acc_stderr": 0.014899597242811482 + }, + "anli_r2": { + "acc": 0.324, + "acc_stderr": 0.014806864733738857 + }, + "anli_r3": { + "acc": 0.3491666666666667, + "acc_stderr": 0.013767075395077247 + }, + "cb": { + "acc": 0.42857142857142855, + "acc_stderr": 0.06672848092813058, + "f1": 0.36493558776167473 + }, + "copa": { + "acc": 0.77, + "acc_stderr": 0.042295258468165065 + }, + "hellaswag": { + "acc": 0.4695279824736108, + "acc_stderr": 0.004980506329407586, + "acc_norm": 0.6156144194383589, + "acc_norm_stderr": 0.0048545552940175395 + }, + "rte": { + "acc": 0.5451263537906137, + "acc_stderr": 0.029973636495415252 + }, + "winogrande": { + "acc": 0.5832675611681136, + "acc_stderr": 0.013856250072796316 + }, + "storycloze_2016": { + "acc": 0.7199358631747729, + "acc_stderr": 0.01038376499392048 + }, + "boolq": { + "acc": 0.6220183486238532, + "acc_stderr": 0.008480656964585246 + }, + "arc_easy": { + "acc": 0.6018518518518519, + "acc_stderr": 0.010044662374653396, + "acc_norm": 0.5286195286195287, + "acc_norm_stderr": 0.010242962617927197 + }, + "arc_challenge": { + "acc": 0.27474402730375425, + "acc_stderr": 0.013044617212771227, + "acc_norm": 0.295221843003413, + "acc_norm_stderr": 0.013329750293382316 + }, + "sciq": { + "acc": 0.832, + "acc_stderr": 0.011828605831454267, + "acc_norm": 0.751, + "acc_norm_stderr": 0.013681600278702296 + }, + "piqa": { + "acc": 0.750272034820457, + "acc_stderr": 0.010099232969867483, + "acc_norm": 0.7600652883569097, + "acc_norm_stderr": 0.009963625892809545 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b21bc4seed1/evaluation/rankeval/4b284b21bc4seed1_1.json b/4b284b21bc4seed1/evaluation/rankeval/4b284b21bc4seed1_1.json new file mode 100644 index 0000000000000000000000000000000000000000..b63df694ea2ddfdec3ea8fdec7e22637cc7bc4d5 --- /dev/null +++ b/4b284b21bc4seed1/evaluation/rankeval/4b284b21bc4seed1_1.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.321, + "acc_stderr": 0.014770821817934642 + }, + "anli_r2": { + "acc": 0.321, + "acc_stderr": 0.014770821817934647 + }, + "anli_r3": { + "acc": 0.3333333333333333, + "acc_stderr": 0.013613950010225603 + }, + "cb": { + "acc": 0.5, + "acc_stderr": 0.06741998624632421, + "f1": 0.35714285714285704 + }, + "copa": { + "acc": 0.74, + "acc_stderr": 0.04408440022768079 + }, + "hellaswag": { + "acc": 0.4691296554471221, + "acc_stderr": 0.004980262025472478, + "acc_norm": 0.6161123282214698, + "acc_norm_stderr": 0.004853371646239242 + }, + "rte": { + "acc": 0.5667870036101083, + "acc_stderr": 0.02982676408213828 + }, + "winogrande": { + "acc": 0.5651144435674822, + "acc_stderr": 0.013932814110418025 + }, + "storycloze_2016": { + "acc": 0.721004810261892, + "acc_stderr": 0.010371620932652793 + }, + "boolq": { + "acc": 0.5773700305810398, + "acc_stderr": 0.008639722698719023 + }, + "arc_easy": { + "acc": 0.6043771043771043, + "acc_stderr": 0.010033741393430986, + "acc_norm": 0.5686026936026936, + "acc_norm_stderr": 0.010162752847747501 + }, + "arc_challenge": { + "acc": 0.28668941979522183, + "acc_stderr": 0.013214986329274762, + "acc_norm": 0.3037542662116041, + "acc_norm_stderr": 0.013438909184778759 + }, + "sciq": { + "acc": 0.883, + "acc_stderr": 0.010169287802713329, + "acc_norm": 0.859, + "acc_norm_stderr": 0.011010914595992445 + }, + "piqa": { + "acc": 0.7519042437431991, + "acc_stderr": 0.010077118315574715, + "acc_norm": 0.7606093579978237, + "acc_norm_stderr": 0.00995588425029168 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b21bc4seed1/evaluation/rankeval/4b284b21bc4seed1_1_lm-eval_global_step80108_2023-02-15-11-04-03_1shots_backup.json b/4b284b21bc4seed1/evaluation/rankeval/4b284b21bc4seed1_1_lm-eval_global_step80108_2023-02-15-11-04-03_1shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..b63df694ea2ddfdec3ea8fdec7e22637cc7bc4d5 --- /dev/null +++ b/4b284b21bc4seed1/evaluation/rankeval/4b284b21bc4seed1_1_lm-eval_global_step80108_2023-02-15-11-04-03_1shots_backup.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.321, + "acc_stderr": 0.014770821817934642 + }, + "anli_r2": { + "acc": 0.321, + "acc_stderr": 0.014770821817934647 + }, + "anli_r3": { + "acc": 0.3333333333333333, + "acc_stderr": 0.013613950010225603 + }, + "cb": { + "acc": 0.5, + "acc_stderr": 0.06741998624632421, + "f1": 0.35714285714285704 + }, + "copa": { + "acc": 0.74, + "acc_stderr": 0.04408440022768079 + }, + "hellaswag": { + "acc": 0.4691296554471221, + "acc_stderr": 0.004980262025472478, + "acc_norm": 0.6161123282214698, + "acc_norm_stderr": 0.004853371646239242 + }, + "rte": { + "acc": 0.5667870036101083, + "acc_stderr": 0.02982676408213828 + }, + "winogrande": { + "acc": 0.5651144435674822, + "acc_stderr": 0.013932814110418025 + }, + "storycloze_2016": { + "acc": 0.721004810261892, + "acc_stderr": 0.010371620932652793 + }, + "boolq": { + "acc": 0.5773700305810398, + "acc_stderr": 0.008639722698719023 + }, + "arc_easy": { + "acc": 0.6043771043771043, + "acc_stderr": 0.010033741393430986, + "acc_norm": 0.5686026936026936, + "acc_norm_stderr": 0.010162752847747501 + }, + "arc_challenge": { + "acc": 0.28668941979522183, + "acc_stderr": 0.013214986329274762, + "acc_norm": 0.3037542662116041, + "acc_norm_stderr": 0.013438909184778759 + }, + "sciq": { + "acc": 0.883, + "acc_stderr": 0.010169287802713329, + "acc_norm": 0.859, + "acc_norm_stderr": 0.011010914595992445 + }, + "piqa": { + "acc": 0.7519042437431991, + "acc_stderr": 0.010077118315574715, + "acc_norm": 0.7606093579978237, + "acc_norm_stderr": 0.00995588425029168 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b21bc4seed1/evaluation/rankeval/4b284b21bc4seed1_2.json b/4b284b21bc4seed1/evaluation/rankeval/4b284b21bc4seed1_2.json new file mode 100644 index 0000000000000000000000000000000000000000..34b9b1a2a6ac3eb6c3454952b8b6cceefa32a1c5 --- /dev/null +++ b/4b284b21bc4seed1/evaluation/rankeval/4b284b21bc4seed1_2.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.325, + "acc_stderr": 0.014818724459095524 + }, + "anli_r2": { + "acc": 0.322, + "acc_stderr": 0.014782913600996678 + }, + "anli_r3": { + "acc": 0.335, + "acc_stderr": 0.013630871843821476 + }, + "cb": { + "acc": 0.42857142857142855, + "acc_stderr": 0.06672848092813058, + "f1": 0.3018475149622691 + }, + "copa": { + "acc": 0.79, + "acc_stderr": 0.040936018074033256 + }, + "hellaswag": { + "acc": 0.4645488946425015, + "acc_stderr": 0.004977223485342027, + "acc_norm": 0.6139215295757817, + "acc_norm_stderr": 0.004858539527872464 + }, + "rte": { + "acc": 0.5595667870036101, + "acc_stderr": 0.029882123363118712 + }, + "winogrande": { + "acc": 0.579321231254933, + "acc_stderr": 0.013874526372008327 + }, + "storycloze_2016": { + "acc": 0.721004810261892, + "acc_stderr": 0.010371620932652793 + }, + "boolq": { + "acc": 0.5923547400611621, + "acc_stderr": 0.008594580270731615 + }, + "arc_easy": { + "acc": 0.6203703703703703, + "acc_stderr": 0.009958037725468575, + "acc_norm": 0.5959595959595959, + "acc_norm_stderr": 0.010069061649549549 + }, + "arc_challenge": { + "acc": 0.2883959044368601, + "acc_stderr": 0.013238394422428164, + "acc_norm": 0.302901023890785, + "acc_norm_stderr": 0.013428241573185349 + }, + "sciq": { + "acc": 0.893, + "acc_stderr": 0.009779910359847167, + "acc_norm": 0.879, + "acc_norm_stderr": 0.010318210380946088 + }, + "piqa": { + "acc": 0.750272034820457, + "acc_stderr": 0.010099232969867486, + "acc_norm": 0.750816104461371, + "acc_norm_stderr": 0.01009188277012021 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b21bc4seed1/evaluation/rankeval/4b284b21bc4seed1_2_lm-eval_global_step80108_2023-02-15-11-04-03_2shots_backup.json b/4b284b21bc4seed1/evaluation/rankeval/4b284b21bc4seed1_2_lm-eval_global_step80108_2023-02-15-11-04-03_2shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..34b9b1a2a6ac3eb6c3454952b8b6cceefa32a1c5 --- /dev/null +++ b/4b284b21bc4seed1/evaluation/rankeval/4b284b21bc4seed1_2_lm-eval_global_step80108_2023-02-15-11-04-03_2shots_backup.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.325, + "acc_stderr": 0.014818724459095524 + }, + "anli_r2": { + "acc": 0.322, + "acc_stderr": 0.014782913600996678 + }, + "anli_r3": { + "acc": 0.335, + "acc_stderr": 0.013630871843821476 + }, + "cb": { + "acc": 0.42857142857142855, + "acc_stderr": 0.06672848092813058, + "f1": 0.3018475149622691 + }, + "copa": { + "acc": 0.79, + "acc_stderr": 0.040936018074033256 + }, + "hellaswag": { + "acc": 0.4645488946425015, + "acc_stderr": 0.004977223485342027, + "acc_norm": 0.6139215295757817, + "acc_norm_stderr": 0.004858539527872464 + }, + "rte": { + "acc": 0.5595667870036101, + "acc_stderr": 0.029882123363118712 + }, + "winogrande": { + "acc": 0.579321231254933, + "acc_stderr": 0.013874526372008327 + }, + "storycloze_2016": { + "acc": 0.721004810261892, + "acc_stderr": 0.010371620932652793 + }, + "boolq": { + "acc": 0.5923547400611621, + "acc_stderr": 0.008594580270731615 + }, + "arc_easy": { + "acc": 0.6203703703703703, + "acc_stderr": 0.009958037725468575, + "acc_norm": 0.5959595959595959, + "acc_norm_stderr": 0.010069061649549549 + }, + "arc_challenge": { + "acc": 0.2883959044368601, + "acc_stderr": 0.013238394422428164, + "acc_norm": 0.302901023890785, + "acc_norm_stderr": 0.013428241573185349 + }, + "sciq": { + "acc": 0.893, + "acc_stderr": 0.009779910359847167, + "acc_norm": 0.879, + "acc_norm_stderr": 0.010318210380946088 + }, + "piqa": { + "acc": 0.750272034820457, + "acc_stderr": 0.010099232969867486, + "acc_norm": 0.750816104461371, + "acc_norm_stderr": 0.01009188277012021 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b21bc4seed1/evaluation/rankeval/4b284b21bc4seed1_3.json b/4b284b21bc4seed1/evaluation/rankeval/4b284b21bc4seed1_3.json new file mode 100644 index 0000000000000000000000000000000000000000..10d6818e7e42c4482e1474a8f0ec6c0f143fd7b8 --- /dev/null +++ b/4b284b21bc4seed1/evaluation/rankeval/4b284b21bc4seed1_3.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.318, + "acc_stderr": 0.014734079309311901 + }, + "anli_r2": { + "acc": 0.33, + "acc_stderr": 0.01487687202745673 + }, + "anli_r3": { + "acc": 0.32916666666666666, + "acc_stderr": 0.01357080625843363 + }, + "cb": { + "acc": 0.4642857142857143, + "acc_stderr": 0.0672477765493766, + "f1": 0.3314669652855543 + }, + "copa": { + "acc": 0.83, + "acc_stderr": 0.03775251680686371 + }, + "hellaswag": { + "acc": 0.4684325831507668, + "acc_stderr": 0.0049798268294007665, + "acc_norm": 0.6182035451105358, + "acc_norm_stderr": 0.004848341560492134 + }, + "rte": { + "acc": 0.5595667870036101, + "acc_stderr": 0.02988212336311871 + }, + "winogrande": { + "acc": 0.5698500394632992, + "acc_stderr": 0.013914685094716698 + }, + "storycloze_2016": { + "acc": 0.7172634954569749, + "acc_stderr": 0.01041380648612127 + }, + "boolq": { + "acc": 0.6024464831804281, + "acc_stderr": 0.00855952325693682 + }, + "arc_easy": { + "acc": 0.6136363636363636, + "acc_stderr": 0.00999129677815963, + "acc_norm": 0.6102693602693603, + "acc_norm_stderr": 0.01000716939179705 + }, + "arc_challenge": { + "acc": 0.28668941979522183, + "acc_stderr": 0.013214986329274776, + "acc_norm": 0.302901023890785, + "acc_norm_stderr": 0.013428241573185347 + }, + "sciq": { + "acc": 0.903, + "acc_stderr": 0.009363689373248107, + "acc_norm": 0.886, + "acc_norm_stderr": 0.010055103435823335 + }, + "piqa": { + "acc": 0.749727965179543, + "acc_stderr": 0.010106561880089782, + "acc_norm": 0.7557127312295974, + "acc_norm_stderr": 0.01002476517228425 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b21bc4seed1/evaluation/rankeval/4b284b21bc4seed1_3_lm-eval_global_step80108_2023-02-15-11-04-03_3shots_backup.json b/4b284b21bc4seed1/evaluation/rankeval/4b284b21bc4seed1_3_lm-eval_global_step80108_2023-02-15-11-04-03_3shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..10d6818e7e42c4482e1474a8f0ec6c0f143fd7b8 --- /dev/null +++ b/4b284b21bc4seed1/evaluation/rankeval/4b284b21bc4seed1_3_lm-eval_global_step80108_2023-02-15-11-04-03_3shots_backup.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.318, + "acc_stderr": 0.014734079309311901 + }, + "anli_r2": { + "acc": 0.33, + "acc_stderr": 0.01487687202745673 + }, + "anli_r3": { + "acc": 0.32916666666666666, + "acc_stderr": 0.01357080625843363 + }, + "cb": { + "acc": 0.4642857142857143, + "acc_stderr": 0.0672477765493766, + "f1": 0.3314669652855543 + }, + "copa": { + "acc": 0.83, + "acc_stderr": 0.03775251680686371 + }, + "hellaswag": { + "acc": 0.4684325831507668, + "acc_stderr": 0.0049798268294007665, + "acc_norm": 0.6182035451105358, + "acc_norm_stderr": 0.004848341560492134 + }, + "rte": { + "acc": 0.5595667870036101, + "acc_stderr": 0.02988212336311871 + }, + "winogrande": { + "acc": 0.5698500394632992, + "acc_stderr": 0.013914685094716698 + }, + "storycloze_2016": { + "acc": 0.7172634954569749, + "acc_stderr": 0.01041380648612127 + }, + "boolq": { + "acc": 0.6024464831804281, + "acc_stderr": 0.00855952325693682 + }, + "arc_easy": { + "acc": 0.6136363636363636, + "acc_stderr": 0.00999129677815963, + "acc_norm": 0.6102693602693603, + "acc_norm_stderr": 0.01000716939179705 + }, + "arc_challenge": { + "acc": 0.28668941979522183, + "acc_stderr": 0.013214986329274776, + "acc_norm": 0.302901023890785, + "acc_norm_stderr": 0.013428241573185347 + }, + "sciq": { + "acc": 0.903, + "acc_stderr": 0.009363689373248107, + "acc_norm": 0.886, + "acc_norm_stderr": 0.010055103435823335 + }, + "piqa": { + "acc": 0.749727965179543, + "acc_stderr": 0.010106561880089782, + "acc_norm": 0.7557127312295974, + "acc_norm_stderr": 0.01002476517228425 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b21bc4seed1/evaluation/rankeval/4b284b21bc4seed1_4.json b/4b284b21bc4seed1/evaluation/rankeval/4b284b21bc4seed1_4.json new file mode 100644 index 0000000000000000000000000000000000000000..5b948a0034e9368a4c25af8746e8aa66142814a0 --- /dev/null +++ b/4b284b21bc4seed1/evaluation/rankeval/4b284b21bc4seed1_4.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.321, + "acc_stderr": 0.01477082181793464 + }, + "anli_r2": { + "acc": 0.342, + "acc_stderr": 0.01500870618212173 + }, + "anli_r3": { + "acc": 0.32083333333333336, + "acc_stderr": 0.013480882752851552 + }, + "cb": { + "acc": 0.5178571428571429, + "acc_stderr": 0.06737697508644647, + "f1": 0.35968427443837275 + }, + "copa": { + "acc": 0.82, + "acc_stderr": 0.038612291966536955 + }, + "hellaswag": { + "acc": 0.465345548695479, + "acc_stderr": 0.004977782217582457, + "acc_norm": 0.6182035451105358, + "acc_norm_stderr": 0.004848341560492137 + }, + "rte": { + "acc": 0.5595667870036101, + "acc_stderr": 0.029882123363118712 + }, + "winogrande": { + "acc": 0.5753749013417522, + "acc_stderr": 0.013891893150264224 + }, + "storycloze_2016": { + "acc": 0.7242116515232496, + "acc_stderr": 0.010334748387645672 + }, + "boolq": { + "acc": 0.6125382262996942, + "acc_stderr": 0.00852066653613694 + }, + "arc_easy": { + "acc": 0.6224747474747475, + "acc_stderr": 0.009947227833469432, + "acc_norm": 0.601010101010101, + "acc_norm_stderr": 0.010048240683798745 + }, + "arc_challenge": { + "acc": 0.28071672354948807, + "acc_stderr": 0.013131238126975588, + "acc_norm": 0.3191126279863481, + "acc_norm_stderr": 0.013621696119173297 + }, + "sciq": { + "acc": 0.905, + "acc_stderr": 0.009276910103103305, + "acc_norm": 0.902, + "acc_norm_stderr": 0.009406619184621235 + }, + "piqa": { + "acc": 0.7464635473340587, + "acc_stderr": 0.010150090834551782, + "acc_norm": 0.7557127312295974, + "acc_norm_stderr": 0.010024765172284256 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b21bc4seed1/evaluation/rankeval/4b284b21bc4seed1_4_lm-eval_global_step80108_2023-02-15-11-04-03_4shots_backup.json b/4b284b21bc4seed1/evaluation/rankeval/4b284b21bc4seed1_4_lm-eval_global_step80108_2023-02-15-11-04-03_4shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..5b948a0034e9368a4c25af8746e8aa66142814a0 --- /dev/null +++ b/4b284b21bc4seed1/evaluation/rankeval/4b284b21bc4seed1_4_lm-eval_global_step80108_2023-02-15-11-04-03_4shots_backup.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.321, + "acc_stderr": 0.01477082181793464 + }, + "anli_r2": { + "acc": 0.342, + "acc_stderr": 0.01500870618212173 + }, + "anli_r3": { + "acc": 0.32083333333333336, + "acc_stderr": 0.013480882752851552 + }, + "cb": { + "acc": 0.5178571428571429, + "acc_stderr": 0.06737697508644647, + "f1": 0.35968427443837275 + }, + "copa": { + "acc": 0.82, + "acc_stderr": 0.038612291966536955 + }, + "hellaswag": { + "acc": 0.465345548695479, + "acc_stderr": 0.004977782217582457, + "acc_norm": 0.6182035451105358, + "acc_norm_stderr": 0.004848341560492137 + }, + "rte": { + "acc": 0.5595667870036101, + "acc_stderr": 0.029882123363118712 + }, + "winogrande": { + "acc": 0.5753749013417522, + "acc_stderr": 0.013891893150264224 + }, + "storycloze_2016": { + "acc": 0.7242116515232496, + "acc_stderr": 0.010334748387645672 + }, + "boolq": { + "acc": 0.6125382262996942, + "acc_stderr": 0.00852066653613694 + }, + "arc_easy": { + "acc": 0.6224747474747475, + "acc_stderr": 0.009947227833469432, + "acc_norm": 0.601010101010101, + "acc_norm_stderr": 0.010048240683798745 + }, + "arc_challenge": { + "acc": 0.28071672354948807, + "acc_stderr": 0.013131238126975588, + "acc_norm": 0.3191126279863481, + "acc_norm_stderr": 0.013621696119173297 + }, + "sciq": { + "acc": 0.905, + "acc_stderr": 0.009276910103103305, + "acc_norm": 0.902, + "acc_norm_stderr": 0.009406619184621235 + }, + "piqa": { + "acc": 0.7464635473340587, + "acc_stderr": 0.010150090834551782, + "acc_norm": 0.7557127312295974, + "acc_norm_stderr": 0.010024765172284256 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b21bc4seed1/evaluation/rankeval/4b284b21bc4seed1_5.json b/4b284b21bc4seed1/evaluation/rankeval/4b284b21bc4seed1_5.json new file mode 100644 index 0000000000000000000000000000000000000000..684984475060b4af2035ddb6b020d7bb8e1affe1 --- /dev/null +++ b/4b284b21bc4seed1/evaluation/rankeval/4b284b21bc4seed1_5.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.308, + "acc_stderr": 0.014606483127342763 + }, + "anli_r2": { + "acc": 0.329, + "acc_stderr": 0.014865395385928373 + }, + "anli_r3": { + "acc": 0.31916666666666665, + "acc_stderr": 0.013462309712005124 + }, + "cb": { + "acc": 0.5714285714285714, + "acc_stderr": 0.06672848092813059, + "f1": 0.40095238095238095 + }, + "copa": { + "acc": 0.81, + "acc_stderr": 0.03942772444036623 + }, + "hellaswag": { + "acc": 0.46634136626170086, + "acc_stderr": 0.004978462690966927, + "acc_norm": 0.6188010356502689, + "acc_norm_stderr": 0.00484688692976345 + }, + "rte": { + "acc": 0.5703971119133574, + "acc_stderr": 0.02979666882912467 + }, + "winogrande": { + "acc": 0.5674822415153907, + "acc_stderr": 0.013923911578623837 + }, + "storycloze_2016": { + "acc": 0.7226082308925709, + "acc_stderr": 0.010353267472010767 + }, + "boolq": { + "acc": 0.6168195718654435, + "acc_stderr": 0.008503021391450788 + }, + "arc_easy": { + "acc": 0.6308922558922558, + "acc_stderr": 0.009901987410242747, + "acc_norm": 0.6136363636363636, + "acc_norm_stderr": 0.009991296778159615 + }, + "arc_challenge": { + "acc": 0.28668941979522183, + "acc_stderr": 0.01321498632927477, + "acc_norm": 0.310580204778157, + "acc_norm_stderr": 0.013522292098053057 + }, + "sciq": { + "acc": 0.915, + "acc_stderr": 0.008823426366942331, + "acc_norm": 0.903, + "acc_norm_stderr": 0.009363689373248123 + }, + "piqa": { + "acc": 0.7464635473340587, + "acc_stderr": 0.010150090834551788, + "acc_norm": 0.7589771490750816, + "acc_norm_stderr": 0.009979042717267314 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b21bc4seed1/evaluation/rankeval/4b284b21bc4seed1_5_lm-eval_global_step80108_2023-02-15-11-04-03_5shots_backup.json b/4b284b21bc4seed1/evaluation/rankeval/4b284b21bc4seed1_5_lm-eval_global_step80108_2023-02-15-11-04-03_5shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..684984475060b4af2035ddb6b020d7bb8e1affe1 --- /dev/null +++ b/4b284b21bc4seed1/evaluation/rankeval/4b284b21bc4seed1_5_lm-eval_global_step80108_2023-02-15-11-04-03_5shots_backup.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.308, + "acc_stderr": 0.014606483127342763 + }, + "anli_r2": { + "acc": 0.329, + "acc_stderr": 0.014865395385928373 + }, + "anli_r3": { + "acc": 0.31916666666666665, + "acc_stderr": 0.013462309712005124 + }, + "cb": { + "acc": 0.5714285714285714, + "acc_stderr": 0.06672848092813059, + "f1": 0.40095238095238095 + }, + "copa": { + "acc": 0.81, + "acc_stderr": 0.03942772444036623 + }, + "hellaswag": { + "acc": 0.46634136626170086, + "acc_stderr": 0.004978462690966927, + "acc_norm": 0.6188010356502689, + "acc_norm_stderr": 0.00484688692976345 + }, + "rte": { + "acc": 0.5703971119133574, + "acc_stderr": 0.02979666882912467 + }, + "winogrande": { + "acc": 0.5674822415153907, + "acc_stderr": 0.013923911578623837 + }, + "storycloze_2016": { + "acc": 0.7226082308925709, + "acc_stderr": 0.010353267472010767 + }, + "boolq": { + "acc": 0.6168195718654435, + "acc_stderr": 0.008503021391450788 + }, + "arc_easy": { + "acc": 0.6308922558922558, + "acc_stderr": 0.009901987410242747, + "acc_norm": 0.6136363636363636, + "acc_norm_stderr": 0.009991296778159615 + }, + "arc_challenge": { + "acc": 0.28668941979522183, + "acc_stderr": 0.01321498632927477, + "acc_norm": 0.310580204778157, + "acc_norm_stderr": 0.013522292098053057 + }, + "sciq": { + "acc": 0.915, + "acc_stderr": 0.008823426366942331, + "acc_norm": 0.903, + "acc_norm_stderr": 0.009363689373248123 + }, + "piqa": { + "acc": 0.7464635473340587, + "acc_stderr": 0.010150090834551788, + "acc_norm": 0.7589771490750816, + "acc_norm_stderr": 0.009979042717267314 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7ade49fdb7d3d5bbda82506a5e45156333e772d4 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e9fac7539c92a1050a2195cf8b222b282b158033f693c69af82e37c93900ac4c +size 199058647 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5a8c3ffdc52c2d254e23c540cdfe639e12863986 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:814eca016053d2079bb91ad685e8a4d7aa2d838ea2a2024cc255095bc4eb8681 +size 199058647 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b1e2673aef562afc5a594336dfbd3d8f2572f4da --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:47f8359ba90d45a5a8e32f422b75d0b297c09d7e3d0b896cedb3eadc603e1e7f +size 199058733 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e7b49acfd275be3880199a163369905339240939 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:abd1c35a216fbd0a67dc1ca3287f6801d3b9c7678480ae2335efa6aa28db5108 +size 199058733 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f24cedf51c2ac6848f59860fe7c91ae128012eef --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ebb3c9533343f7646f99a18e6925d0ace20c9bd3df39cdb76452facb802d1276 +size 199058797 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cd998804ded9201c31966e5dd829b122c7b1eff4 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7a84d7ab4abfd9f7097413494355f66fd76c99f89bb51e65a968b8dda09a28f +size 199058797 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ad20c64bccecb342839519c6c2dd927a37472b28 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:75fea0bf01e0290432acdcd6a2c8780cc964a62d5895a703c7f4b11c29501956 +size 199058733 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c40cb5b7b580eb0432891eaf7e2c5b1053ba1088 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d7c05508404338e06c013dc9dc866f3279ad7e636c76f14a820cd497a086f42c +size 199058733 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9b62b70943fd4fc6468c5bb28cdf19e2502c78d7 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df86cd09b615e33196cf3153149b11a8176c3784ab8e641738a6a1b289b581ff +size 199058733 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..490eef97c979c70726d1795822877400b4bd756c --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73774866a67ed5ce03e3e4bcbaa4779d16dd18f0682e6e30f7c009c8991ee804 +size 199058733 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0e933cc722d24c77d11c1359cba2b83fcb7d2629 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a6d6358e1fa0c64ba34407e8598d96714d0f09a2ab335330da0aff3e68006ab6 +size 199058797 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..357754eb1e0c4de08fde62149bff7f462c19995d --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:42e7008de497d94303460990773c0798ccfbeff7f699221207f20cfdf232eb92 +size 199058797 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a62f5056fcee5ad4ef1ccc3ab48d088bc24d90c6 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3cce22c8fb482edcadcfa68fc13f0ad5533c81690016a99059af3b429aa7de29 +size 199058733 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a6a6c4bacfe1f291bc29491a29bd53ef098e714d --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:03c1b802415b30ca5703f9c718e26301ab87dd09262b509311ecd549c10e0af8 +size 199058733 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ebae707084d84aaf84ec99e5f5e4f31e656ce735 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:383bccc51b33d4843da74e3e58c55b941cbd7382508dea6a10ddd0451ddfe384 +size 199058669 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fec25aed790a5f62f6d8f6812e974d95f42efe75 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0226c7ae0b47934d47857bc9a9e6791712b58aeb8a7747606be6db348de3c7bd +size 199058669 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e4eb255a2311988b51adecddb1f6c2a5d0519ee5 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d5d35aa6f8eb9c93afcba2f9910c42035fa01ca5465949a7dbb648b0a18ca53d +size 199058797 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..620348ec97113d05d3549b3cb88678c4d0a1d499 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8635f8f62e5c2521d8ff6d4abece32e10c2f4b77f239eedb2f3f327e0e9576f8 +size 199058797 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f0c172da0d8d09f334b08db667fb6216e99389b4 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7aecf015e1cd60f052c5d95b54500a155fdc115d8d0ed57be26a2c77398409eb +size 199058733 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0598328952bdaed66ef5bdc5898f86313c055ca9 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac89885ed4858f92e40abf38c6550d8ff207ad7a4a5d98e9b5b46402f9018502 +size 199058733 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a5a380cbec7f35de0512e19533391754fcd65529 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc09ce3b41343a93361d4a93bf08673f76d7b89a2cc3b6df1f6bf11d7bcf0644 +size 199058733 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..96503ff60cf22caa2ccc20f0bca924aeea3a9301 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b612c4b274b04636698920d27aa1052ad95674d57ff947f88a9013526304515f +size 199058733 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9f72d82b99b3ba08bb33b2e3e195c5aa9ee594a8 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:13a65ea3b9e3d2531d994007a4195a483bf83d03c8b19c5a684557a98ed5ff6a +size 199058658 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9380b5e150d6579addcebafde542ecd7368e474f --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9dfe76dc46d225f8e73c059dc38990e050587d5f8d98785faeb509b483c02f8d +size 199058658 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d13195eafea59e7e62ff44d191e82f978e23e6f0 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6097f2d34ff7063f4120963ca618107779f12c57bcbc48c911e6fcef5c8e3fb5 +size 199058733 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9b04275c3c4ce7944ea790224d948dc2d5399f44 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:00e39d47fc6ebc09aafac281581a596084b10d2c7dddb75ba895b6bd7a884acf +size 199058733 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dc2d4b325e9c287f3a5cda81c212d05c90806239 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:18bf93f7c5c1b7275c62b683fdfd1e4ad6d91efb84482a6936fc30558a1f69bd +size 199058797 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f2fff41a8f0ea9e28b1d5f6c075ffe9a43f386ff --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:95d75e36d807763e650304f7c92babebbd4da6abd934115557f77c282fac49b8 +size 199058797 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9d6e25f4dfcb6ab25d7559cf0a9191d4f59d9bfe --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b3f9f1b67a03c1c2ce3a2de1cc21be449dcabc5bbd55ad68af9bae7b3ef5302 +size 199058605 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6505cb9cef68e0221bc4067188769365b47d93ce --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d5ba2ff90fbcb03f7bdc0465e9435ec06ac4290e151c2ec91f95a7ba367ab4f +size 199058605 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0d9889cb634474490042ece62d2591908e18d3b4 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:98eea8e19e6335afed86d6357da143721418bc8ce182d9537c0d7d40e3db173f +size 199058669 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d89a717a2ed6b7b344f2f3ec667142245dcebcf2 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:528f73890af10b5191ee585a8c6e697a27d0fcd6bb877b064deec3c9464f665f +size 199058669 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..be75f7c0b93eb7663caf6eea5c9132eecf3db0c0 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ebf4954d935c76f99144e2a0d55f2ad9fbfe7d9c1fa14a7c4cf55a1ba150e925 +size 199058797 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d210d663520ed62cc19326b44c6d91d7d57d1d26 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:43b17ce66a0d1a7892752abb90e730c009300a727e3c799e3f936ba4fc1ac553 +size 199058797 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..35a6ca2da503a42c57ce02cb34ccf25af940ce8c --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a001f6b866a15ae8e585d7d83e0051a7dd48dfb7fdf300fb326a94c0b18495cf +size 199058733 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..10dcb0b428089d5c5b3c30aaf6dca8ddf8cf92f2 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ee46d138856c925923d903d033c1a697db8b214b1cd5e53028f28e08e3c2114 +size 199058733 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e9d4734cf8bc53a2ceb27d7b9593fa63163bf4c1 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:56ad43b4bec7ac3694e4bdfccefc0faabe68e5a83f14296c0f0be9ad9df6efd6 +size 199058733 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7afc3343f539db69c5c3cdfd0b43126717e6c54e --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6fb9e1d083c847924f770dbdcf07ed94a5fd2c5ec74c93ea12b74fac4ba430d1 +size 199058733 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ea7a34159c4abdefcb8032e9223a0779112c1351 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:54de7411820ff7a763027e70ee3fec635bd8145d950c051ecdb6556edc5e4967 +size 199058733 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ab56fc64e243ec980ae05e1c9da1076ef09d97f8 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:65423035749ff37ac7b7c085f7a4040ed1da2610c31116bc0a22d894c9ed9bef +size 199058733 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0eecea9370b11b4e839c33dc60ad116f239c5834 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10c1a6350d31923c2eb6cc9607ce9bbc41c80fbec084618c9f2288ca57e8835e +size 199058797 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a708f51237fb8012bb695b9caac67315f3942571 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:703f556e0e518c9a551753e3193e566a7fdcd31ff6c777d0d4f9c15cb613e7be +size 199058797 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5eb26a42c63836ddb2dfb56e7432d0a5d048fd13 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eea6a3dfc082e74b419eabe72639ab6e30bd64fbe31ac1dba3f05affd1643150 +size 199058669 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ca8de80af6ff3b08b01a5a17285c31cfe27a8463 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e64bfeae45a3607ec36df7ebdf8920b38074785878d6af2932b3370948700f81 +size 199058669 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5a704f296647f54a3cc18273adf06ff0cb7f3093 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d07450a09edf6966f5f7c95586f19f59f75f14d53695f60fa08578a19b9f3658 +size 199058850 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a18621f6860dda1a2007a91c68c0478e2137e008 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:45d9f784eac91b853c37aa9ce4c59fed3e392c358c1bd9595bc9f6a9a815fe3e +size 199058850 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1259e58d4c414c09b49a4bfa5db2aa35773016f6 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a080475fc8082b110c2db102fed2160ebae75cd85c41a40bf10622127c5fb421 +size 199058669 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bb0714a07e66297689afce06f12af81be430527d --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:47f977b3c7b947c3375b4d6fd963e589ed8615fd11c7f4a1abfe528ebcd92173 +size 199058669 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..800f7558846b4df849e1cfcdb950da4904cf1ae9 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c3b803b782ce7b0065dff325e3326f7440549f71504d989613db9f17ccd1e08 +size 199058797 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..00ce7b4ce06905e973e01d27b60e27de52f3ddaa --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f67631fa024ede83f27b6f88f859233110bb8e7e0380b841a310903530d0b885 +size 199058797 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dddd67b5ce455d1760729f1e7174d0b30142e992 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0cc80344fb95c06620d2686ee71cbe59d9fab918502b01211fedde5fbbd31170 +size 199058733 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b62b695258e2a38d43b4fa324a59a824d900a952 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da4e848f6b6115d149fd2728b6bea577631fb916e7c5c99897322bbdcf159010 +size 199058733 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5f3d7c826ec236e6948a3966a2c827fe921b8c3b --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3001e48426e13b25e9ce6e5f36ed75676ca80bb0aae861e7b6d9a6a2762a79b8 +size 199058733 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..736ebfad3df1e002fad0e8ed1e1dadb9b4739de4 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e81cc2b3f02bad12f1ad7b328a9f626d61a0f58c558b56e30c3c9c1e8ac6a0b +size 199058733 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..804228f53a1c47b7784cad4a2f43d9641a00ca30 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cae617378b15c41c99c2623ce42e1c5579fc7a0fe781e64666f5ef4a34ef088e +size 199058669 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9815b113ebbcefb8a9661968e88f0df54a534d1c --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:348f6bed60919d768e156dcc1d49444f5144705827aa5074a453f27555e0f99c +size 199058669 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5590a3f6a3e28635f65b2acc5aa67c6e95e13d8c --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:85a8148189afc8651137af9b245f8cf7520f5d2724058483d41bdd8b13b48e35 +size 199058925 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e3951c1be619862e1cb92b5e74af02210881f0d8 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:25c197ed9f1cb1d36591f033fbba932dec1922a6b12d8e48028727f301a066dd +size 199058925 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5094cde487e469bc099086917c3db9e8be59925a --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:59807bc9e9e81964fd861b55e8f514ec123c6f06e1370a340c7bb5e2d2e33822 +size 199058605 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..80267a5b61630650740b747f306e3ea7984b2371 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b33fd8488636ba045dd280af0421426a088b4b77a05c050b98dc21dbc6e8210 +size 199058605 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dfec0361a0b14265ea52f669256612003d652920 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b68874a11403890d7b8e5f18669438d516fb92828736193fd9a3c0931c0b23f +size 199058605 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1df86a73d57d88bcf241c752234e44e932295d4b --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:923a2c97da47c74f6e7809a20cdda81a6e34482bdb5e6133adec9d380da45890 +size 199058605 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fd36614e186e21fd2f4248e78f02613fb40ff6a9 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:40cd7aebfabb0885ece2c25acffd646a5e0d8b8a9b05653fd4e32583ca3f601e +size 199058722 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..46369da709db918b86974141e0349088640829ea --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:05a09560aaa6ed57efec12dd09be2bfb71b4b20ef1236f60a9737f04dc872d8a +size 199058722 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6b5d32dedebe3165eab3808fb5fcee0902706f52 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b5c0d495baa0d4c44cca336754ee7246fb83e313086d16c75742a51eb0e062a +size 199058658 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b2e265f90e56a8d74db21518a9673998bffc1fbc --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c23e35ff4c3244f64f3f971075f2d1b8446b08d00c3575b5fec3955dedf8715 +size 199058658 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9d6a4a592458036439e70b47af1b21b5713e2c86 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8bede2923b680305ad7e0b7d2a83039337ccf24c9ad1162c9a223d6bd05a43cb +size 199058722 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..69a0fc22ee6bef135a30ae93cde044aa63648b1b --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b7c58b2b0b123ba8424db20d30948e15290c4c6d45a87190d5567aea42338bb +size 199058722 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c24de5f27017bb844efc605955b8b462c96b2c02 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bda3a15ecaa000a87ea88b13fdc431819629e16c037a3c1f8366476f9ed68ac7 +size 199058658 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e24061cf6dc8ad3d83fffd177843434d9c204186 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e622209ba2f65429650a1f8e18b5336320beca7033c6f818e1b5f44022ba1233 +size 199058658 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e3e1e3e4e587f92cb10fe6e68f17aa919ea725fe --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f647566684707d0efc8566d3241040a3e688123ba32e2ab587ef3f6def214687 +size 199058786 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6dade5794965e831efc0ac6e7b5a5e8e5936d58c --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c236bf4f398f9fb0a83c0ceced86aef49876d8b4fceaed1cf83fd428ba4b45e9 +size 199058786 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f045bbbff762cc14ded9cf542c0a703cccbedaf8 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1829ee89ac9095658db8c3fee5690930768e0888603acc758c212d506b22108 +size 199058658 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..20294b59424295b43c2d5e3129afe6f37f705b51 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c76f6118caf67293b95c27ac0b92188e669bb5b43fcdbeb99d3b0a4d0fe6edb +size 199058658 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c93bb4ca4ce115eb4689787c008ca073e10c1bfb --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f22b6974adb11d371a2eede607a0bef2030a4281166cec209c791b703971bee +size 199058978 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..782f584b1362e3a7f1e4cda4ec07535293cf1a24 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0122cd80200d89aaadf770c84d4e3f4bb42116e057bcbfd06eb3ea3edd271646 +size 199058978 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f48788663bdcb1ecabef3393fe2c4e91c26bfa62 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd8b84e202794cc59ed1528bb5c8750cf25ac08bdce0483b0c039a551b23d82c +size 199058658 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1420f219b7e31d732f2cec923e778bdd11f3ec69 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:19c94c8daa9d918e8be36dc528792a444179c8739dc64c6fbf1b9ad8df191b10 +size 199058658 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c2dd70d55ac04102fb3e78e22870673c58cce97c --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d8faa1797c69389ce0cb32b365d473c5a7cf7bd6950d1f73a1d16430c1cd073 +size 199058647 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a3852433567415ca592f6709ce6c81a11aae9321 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:00feaffc64d20b5dbd12226fb463d6c85e07888d06d23c6e6a271d5956f2a105 +size 199058647 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..31d25cbe4891f0824194a4f2a8029295613ad1da --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7a2a8e5893542c2385e222504448d59bfba39f0eb42523a0d853fcb65bdd454 +size 199058658 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cbe5f26ed8ccbc6d8ed0846cba27e6e8140e4a90 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8d282c7a71d594d04b6921f51d39cf56a6b649aa11b24b8ac774b5fb2776f9f +size 199058658 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c57c483c1d089ed1fe68cdaa1f18882c8ff2af98 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64e35a4c486e2c73ccc127489fd8f68823122ff509b43f644458cd50f16cbc80 +size 199058722 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2e38d47ca0454225425fdd36d4dc6572513facb8 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f5c13c657da7b2567083905f7829740fb4597a31eef3fb10ef282ae914e2dc1f +size 199058722 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4a32bf579cbc276453fc3e9a7d5e7541f5ecd765 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c01bf6a485da16077f2b4f0dc336711e2f20575e29b5914eb0659d620999043c +size 199058658 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2bf7852f7494e6d13d848c0079dc791e9311ef86 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b58f682c6aa1eb27e19466971f6955eb4c0619f2e915501bda3b9fc83001b9a +size 199058658 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..97e8e3b5f6a9857256d8b7165cbc025204161c1b --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:55b101fce181209cc3b193b302f844cf6194caaa3f4d3fe7dcac45f66f03910d +size 199058786 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9c32fa83ef0e395f5fb10793ff0973d74d7407ab --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d293fba5bc2a0af8ccee3e2b103d61fb0017b1693e2d5c424828c3b57d661ad +size 199058786 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cc93c86dd87c357d09861ca7cc1a58edb8be4f53 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9985d45768a29ca67e875eeb75a1295b730ef7cf789f333ce7c64ac5bf9cc9d2 +size 199058722 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..63bcf976593137c7ee8baf79913a1fb13656f6df --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e59dd32709adcdbe7ac578bb501df7b6a6d049ab05e9b74f2fd980d16dd02005 +size 199058722 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..78e29eeffad9a7086ea3404222c9b8d82ab9c397 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7532c5314e7591b41bcda2cbc585d4f7c947dd25b6996332f32df8c2b02a4050 +size 199058850 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bbf699f26414aae33587e966efb64cd76d95021e --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:133683ef47d78a346deeef55cfd2817e6b11f7920a0df13aca65f3f166b264c6 +size 199058850 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..31e4ff1956b578719ade1ad6cc66d17ef2c27f1a --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a8f025a7b8e5403ef5863ca5e5fe11a913db43c9951fc12cb553552ae113141 +size 199058722 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cd5adcb64c6bac86e20125f221897da509dc3739 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa647cf44a650a623eb2300afc2a6f4eb9d826097846feed31ccc65be3c90f52 +size 199058722 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d0b392fb78fb3651341ec8e359b65d993ab075c7 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7da50769c0f6b6b94402f718c15e0a8f2784a1b1545f96e815b865b1eb191163 +size 199058722 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c3636f4bd613ee90696f676c8ba248689d15ed24 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dbdfd13fbffb312fb149a057c04f5c1487257646e5f138afdcd9b72bc3bbf24e +size 199058722 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..24e906499f1350f02ba2ea57214bbd6282ab15bd --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:94b16ff6c0614e3f7a7d13843d52d1b6c00109dd28544fe83e1ab1f1e1861574 +size 199058594 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..74a539440e26b3dc70a447d3ab91ed3d2ee8d7ee --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8619340583dd044bd73e343642899f2a86483bc2e9f1669b2b7a686f9d8d0639 +size 199058594 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e4257df436019cacaa1b48a05f92db9911116f0b --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ac054cd038913d380b0f1ca178be1811c818af2c014389ac1cf613120143ef3 +size 199058786 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a5f28289cf6f98a95564fe60b77bd18a7e30cf49 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:976255a71a23543f8d0463af5008b685867748481d8ab0c7388ed0b12c48061f +size 199058786 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..812fcc100e4338c853eb42d7b503fb46b556105f --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b2e48d5da349dc986b2065e0f6dc8163458e6e94410da73b0f18b627862982db +size 199058711 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7e41c84d4cbadc9b64caad4167ee661214052e1d --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7bba1cac574f0201b1a9ebd88894a0ecebbcd123840d78606e9316f1476d08a7 +size 199058711 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..da3e250f64194eb5345d2f44654f7826fb67753e --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c16d6f856a41f0a8f7bc9093f8c53ca3f6980487262dbb8a4372f6c6c38723d8 +size 199058722 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4a2817036ad9dec18cb3a07c3d7ce013113fd376 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5cd2a250963b022917f661b487c50edd89ea26978201c321a575c2e4273878d +size 199058722 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f8f6278ee5d59f4bbbea84a768e0df7d40b0714a --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:416e7514a1aebb9e9c6c26c8c8ca74c49b885eddb9b8969f21c69cfc5dfe20e7 +size 199058722 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5d9c7d8c9acc6805fc7248d39949eca22cdc0542 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb4cb2a8c3a483a792fd0b15f79a397b1eff950d90ccad2a8baf68b10082eaae +size 199058722 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c19039426e17bbe34c684ba7768b902bbf89a6ed --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb88fa68a24337169c3eb25cb1239a9730b08fc50a6605d1255475a816dee76c +size 199058722 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9c5e2bdc022fa12d187a7903e2d3041f3fe50f96 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5236a104989a6e8e35bb67179180c7a2ba1285f7d3babc7119420328df13e96 +size 199058722 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3832a755029328cd01d6a5d9462db6429458de86 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a084d0a7c43a71c23b0b8388034711c1f317829b6184781ae1977ba75b0874be +size 199058722 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..47e9dce0570c6cfbcd117d3be018c8e8efa89f86 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec850f40a792c5380c142c048e2383108c4e26cc7092d8dc01ac7e28e2aaeea6 +size 199058722 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ec5fb3ddea1945de667df5fedc1eab99b3e2c798 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:309ea9672354694031b89b7994a0f7dd85779986ba74d089610e4345ff75fb1d +size 199058722 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f777f4f80c3b0cb62981570f40725b35d3b86272 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cec58bcc86c9258b6ab8e0c2b5179e5bbc6ea382456883f57b9d6344605e47d5 +size 199058722 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c6a45a4db0442af13fad942b5a172555de0443c7 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d1d7a92a0249e065edb257a708b58571bc2ddf9bfaad622975a6387d1d03e88c +size 199058594 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b63639b996426f450c4c8794c26d469f79d4050d --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d2277a3c734a48d43a6272e23e2f0c1a6cdc54ba31719b50ae6449b96b7ddb1 +size 199058594 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8bcacf4c2ad7f1a2a6aea03d4583436bee29d253 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:608f3a5993ea23b42e0bb3885a1466082f1f8f76a870098aa2826b6b41960382 +size 199058722 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..95e18d1e87ca0838630354284f1d17fcfb1bee50 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:397742fbd2a19779a2530eb25e9680896287574d2f4376b367adb743d949197e +size 199058722 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a5d7cc7922a7a7dd567de25a4ef1a892e1c00d1d --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f596ed922d070b06d4a54b02474e0c6196eb468699893e2aa662d0aa932ac5c +size 199058786 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4bcf62c418dc873c6f0e3f50ae3737a60f6bcde4 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e96f92980b21419b26e3171369ec5eacc8c10c3a65d02463eebcdecd07f5502 +size 199058786 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6382f365665400abb1c4fb52bdbcb13bcf387905 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:91e170aaa031a1061fad71434889d60c6443fa8b1305f6790f741b7ef86180d8 +size 199058850 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4d306bb634f3410c3650847b3311be8c9dc68afe --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b0647adecd18900e84d59cb6a8002a70b814e354b3f01b0a852f2e3fc0172756 +size 199058850 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fb1f73caf50c5132095fa786938870a94f53a9e7 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:96b3ba965e79bc9dc530a349db662392c2fe5d199cdb4082e846409535ac90be +size 199058658 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7497611e36a8c8045ff96354d2a8aa0c44b52f1a --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a95b20bc917f4490a719ca082e221d216ab68ad67d32786e3ee79f0fbf08cc33 +size 199058658 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..acfc07aa7696234050d062d1743a0366f7a42092 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc4ed7c1463f84d460358ae48a416d3d47368fb0cc695d25e8d8ac1d911226ca +size 199058647 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e606e1f5297882d499b5a71be2e6a420410b97d0 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4211939ebc259a52730b2e1a564f43171d2ab15d746244e116cad96a53ed9da9 +size 199058647 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..53ea61d4568f420684ea6dd967c22d48d683d223 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:63901a55d0cd28bd1b35b9f37680550bb843ca9fced522f3a2eb2035f985b40d +size 199058722 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e2e5458aed3a8fcca3ec954d0bc97f0f9d63e88e --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c4a4b02127f73193b2649c66eb0410185191c1f1a1309b411dc13e177728a38b +size 199058722 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6bff0de7b89638ae2b38f9a89dde5f8acae65d37 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d713f70a1187dea87c3538c682131d0d07eecd8024863053a027e9dc47dedf8c +size 199058658 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..46aed159601dd3987558006cf026c6d896d9746c --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3894a93907e2bf8a5fd320edb6e8883e3a01be48216f0f1fb68eb56d0024af59 +size 199058658 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..66e6a8424dfcfe950529c22039aaef56081360a3 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d102f48aaf2c2fb0b7beab65cd16f8450833dd6c9cb679b0a771f0adf64d2273 +size 199058658 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ef1fe381d795cb6a0f835ddaaed2b269c1fc176c --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51c0963ab5528e350c2dbf8a79ce1b5a88475fc7ee6ffcad9eb67233fff392e9 +size 199058658 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0ec2ae8dbc9bd314ccb8482b18e0b5b7c1187967 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:162058c3dc88360392658a3121c444ded817703b5d9e511415002e9d25676a16 +size 199058722 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..40d790d27b08a4970e8ce1f37c20b8ec91a44e8a --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:67992bc14801d70440e9b688652c1f4def548c218182acaff2dbe58e767c8b9d +size 199058722 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ba8747386863d3dfc46d8c8b8c992248f070ce99 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:465aa3febfae5fda91a12ad41d232b05d6b0bab5074ec2290051bb43a56ad209 +size 199058850 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d12d51358a045a6dd4b71a7a92c6d9c05fc22a56 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4575c1dabd3ca32b3ad393f9c13c1ca8268c4c483d1c42c3f61f77d86d94d950 +size 199058850 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..594dfaa3e8b024044fa607369c1c1c184180daf4 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e9e479228e6597c68cedec5b8b63db50f52b5fbaa1f1a3bbe39cb4d08d4eab41 +size 199058722 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c97822b3c2a95a40a3706b3daf506c967f423202 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:57173eaef2e190f3e4e1431719329ca88330b09292f63beaa359a1baee9e5131 +size 199058722 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e385aa4e89c42614c76ff1ecb35b6d57b1461598 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e08fe1aa742f0d4cddf4eaf50dd52647f6a6708891f552fef7e4b577409442ec +size 199058658 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3c09789621843cb0302cfdae007f77fc8f61d957 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0bab3d28cc50b790f9d59c7e6db17e69dc40c2a27501518c07d579d2fe90f3be +size 199058658 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..04479288e781fe4f31e862c91dcd3456ccdcdee8 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:01aff1ea7a8b2920e8d9aca1881a31e75b16744f8f47eaf75a699dd00362107a +size 199058722 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d38374a2ecff701239e8c5a204de35b6b5bbde7f --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f89988c765d7ff06ec9acdc9e8217c7c3ab9962e1e4f8050c5169f87603b68b7 +size 199058722 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0535bf83b7b2241c8d15e6fbb4ca8c826f5f24da --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f38bd951757751034f908261be952b6779ca00f22c68febf778a436991f9f4f7 +size 199058658 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..18a0b383e0c0b6d86dac4a1f9ccd974ab7eee987 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:edc856b643a6b1923ad30966e6122e9cf90572e8b6ee22fe839545bcea346688 +size 199058658 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1179f0fe1f92d352d59dde2b73ad23021154655f --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:092f9c0ab217bee48009f30c7d1a8c8498a7ff28bea792f8a6d31fc7ff7c6977 +size 199058658 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4b0742defd60beee081baf5bf503bea5989f19ab --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:52173a9358b3ad834caa6bd52b6d8e1d67eb68d044fd048fc5743657c3f08a26 +size 199058658 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bab82e53f62c2edf94b06d3de5c86a16c7e22656 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4fe67652e907649f0e82f972ec164f9a1a23de623fb737b4d4f9e4c35f592b1a +size 199058775 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c06a3d2830750e2bed3e81d45f82065e939275bf --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b633c442ba4165b10c995881a4aaa5d09cbf6d22e309ce678cca90dbe3882788 +size 199058775 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c3c4b9b76e7b9e067ead7e46cc697b3d5b51d029 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df1aa1eb2033c39f24a782b3ce20149b0a6575666adeb9a71bfc5035a9f8e35a +size 199058722 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0ca1858f68cea18aba2d9f4e21f795d9c75175b2 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f81ec74913b73738ac42eb52ad235038bafc26397fbd4fe1f599fbdd614a4b59 +size 199058722 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3703bf388676e5d6593a21a6be1b80e030f94d67 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7249ec9bf7f85a6e3b750430f667b73f06e354c78d69772d313df8002125f0a1 +size 199058850 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e32cbd1ca54918e978fc8057054b2e8525221999 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b1cf8543cc6077eb74e23cffba1a6ed029c070feb5942566bbbc816d62a139c +size 199058850 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a1ce4345b50f9f9e99af97d7db79c08a450421ee --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b473defd963ecd60b8d68b1a3b4ed81c4de667bd7ab147e60e05792fbd9bb22d +size 199058722 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8657d6dae1aa44773d06e2dd59c55e00874363f4 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:116707c196feca3174e8a94f6c2a2b5971c47df1736bef33c1b3e307d4019a5f +size 199058722 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..99cc55d8641a29c225c06fb5691ff78dcc6a8ea5 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:48165edb799c1caaaf1b1d386620e55855e007f650af3c520bb30789475a6076 +size 199058722 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..558b2540cead75941322e2aaf814386670bb04b5 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3fb36be1b0a96c325ca4eb8d1ca50a36db722b081377d42d2bd4d43b833ab0e8 +size 199058722 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..eeab55247c0c1375f56d8ede9396cd13c3ae0fc5 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c2a298de442ecbd7152b8c1b244416f4682f1189e5720891e1858cc765fc438 +size 199058722 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e913d71bb71c5fe09eab2e5a47012871c7c1d094 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9fd00e00599d7ed152afef9a258c78b08b378a5f7dfd823cbe397a1fc51c5e88 +size 199058722 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6b057736627f4f5bb5ad103c6f31913376848182 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a6133deb2d4ad155d0d8a0f09de482a8058ca20100ef48ed3be6c34fbc66f645 +size 199058658 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..19516df9e4c3848155209bf1496d02689f764b2a --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9df99eeff6ba1a5abb3b9c535090ea9ab4eebcb92285a3f8c8e4711fc8a2bffb +size 199058658 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b2a6cb2452a2cee671323307d3029d189fa60f35 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84420a6c29bb3f536d647c5bbb4fb3f7ca0500b9d39a2497b293ea5a1f19d1d8 +size 199058722 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..219842fdbaa14026c5a9e9b17b28d0b3f80e6b04 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77e7d45d08413e62eaac5ffaa9b1a1423cd5eba767b7bcae0e4333e02caf18d3 +size 199058722 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..debce2e260e087f88b5458dd2e668543f17131f5 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aeebedf8aa53d5da4146466ad484482ecfc4ff129431f74e14f7e6b2b9fe5af8 +size 199058658 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f7627bb07b9903b47d398e32e6f4ad65ac622f28 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c925b2f17cda7e968a3756a722a0080509d523199d8ac0744e6d2b889d5cb1b4 +size 199058658 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5126aa29418c5148b78708184b1889795aeef8b5 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:308ca2d5701df5408f86b06ff7b58d697d592fb1fb59fd4f8c3eeef7eae51a50 +size 199058914 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..11505901d2a3079a62e92d2f7e1c9bf7866bd8c0 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3be0dc9c2b29bd2d8087953140793ac5d5cdabc461bf79fa674b857f5261ea42 +size 199058914 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fd4960372915def1b3820a9d8ae09b90675ae334 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb2808ddfac51ab8b7dddc55c2b39bceef87e73957c0a87bef0dee89580904fc +size 199058658 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5048100e9a199f1b7b4a10b97c7d2e1043236080 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b34bdd03e2a6d49d94b44c0dddd66a17c13675aac7c540c548aad106297957ca +size 199058658 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2f39ae49c6fe4f65a0447ddbe2b192cbe6bd7469 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ce1e9ce6f2621fca6de80cc718d24edb94c9accc1d169652e4c2d7039bc8dc0 +size 199058711 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..55775d3a411e44f72967fca0a12929982df2d830 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fdb08c0a80cc7504253b7e297dfcdc770ce1cb6f91c913aacfe0219bfc90892f +size 199058711 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..887390607be72c0bb66ca497bc97bb1ba3e60c2f --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aeda20f51fb7fd8903aad2c443600e3d44f899ad2bfad24cc1e63b1fcdcc0e09 +size 199058722 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f66c5ad68e53483bc5b5938fe5aa17c03af2334a --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:701fed8b7247c255fa31e5e4c46f7725f59ab881c5103729a74dd144064e6201 +size 199058722 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c6867e8381c267a36cf8b2d02ec2d50c8a082925 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6459c95863098f00ff109640bdfe054714bc29c8b5438ac0b6596f5aaf793434 +size 199058722 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0ee7900c7851b79b3eee80f56e591292ae7d1a13 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:98db1c80614bdb5ddc92a58e9ba698deb7971d4d92c0eed1243a6a23617efc02 +size 199058722 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2777d2db413696201eea78bd0bfc6be2202b9e47 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c2351013474fc1e2670ae58fc8c157013dcf812eac43f137d664355bb8050cd1 +size 199058722 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e3d894371350f31416fabf70d31fb5b01441f4fc --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c707c2e9c25abcf02804f25eb16f1c5c38ab4ffba2701f46eb0a6b8affe35e0 +size 199058722 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..38d7e97154913cb9ced86df007653d8a0d037453 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fbefca736b888225b1f851dd78b3def34539e97a5546b72788adfcee84a7309c +size 199058658 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..098c6292a92ee8d89a5b1498ebb8761de786814b --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:12685a2c05e0be4a2896184e3bfdc956e988f2f0cb605ddaa2c9bcfcbe6579f4 +size 199058658 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..70d47c23dc719b934e8545e9c4e1b4831462f7a2 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:94bc592ca1a6a594414007b6d9ced472662a1630513709b9ef6d61a8c795fc9c +size 199058658 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4381168493fda470b8b2b688198e827726629392 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b1e4f323985204057cb4b8f3125167696ed9d2c0e7849adb253d41b6f820010f +size 199058658 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..34917a3916a639448979835f7b4cff51675d49fe --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f09587db69b7a48a2f338c11957fa1ba698c2f802299f7fa0432d3a6f69162a9 +size 199058850 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1dfc0af280f86b23d9d980cb93721e93ed2156bd --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f5656c5dda579a3dfe4d98c8f6a69268174bc2e5982b5374aa29a1ae79c8eddb +size 199058850 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f97f39ed0ceb60a8c59876a9d4e0bc3b5c370383 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7dd07cc670071bfb001252d1db300e108ba462a69866f4e697b203cf33ebc82f +size 199058722 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..be5bb729c1dd9c5f4b9a85c0ecd078bea6bb6369 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c65e7b31d4da31a72ebe73fd265188aca8f835e91254d2c2abc556cee803428 +size 199058722 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3e02b3849deafa879838d5ce28440996fe53685c --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5fed259e55e4825a0a2b5a006da01b3ad5342b51e4fa04a1b7b81521dfcec6f5 +size 199058786 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..825cbb1ca6b030ea03cd7399a1a8cf8f9741beb4 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aea12b4a4de4348e88d76aa8b57a7994b61320e76a79f12a70f1dc2a22e171d8 +size 199058786 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bc73c65a94617e1c38bbfc5bf29ff366c74647f0 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b904e0ac04e72cc9e7188c743ae206dd7aec8cb417f13cb342a5091e76b906c5 +size 199058658 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b0a7d60542eed1b2aa9d7ad2fe990b3ebfbf5753 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f53c02e159a2a7afca6027d9ddf20ece857009e2780847faa25757e8428b65d3 +size 199058658 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4c887d37c9da6a9815f96b09a8ad3e41bc7a1d16 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:289548bb8c3698bdabffecfc40edd047641eab00a69d1629492c565aa1b01ce0 +size 199058722 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7589092a9de745c191ae3629e8d725c88894bbbb --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b999b3098f0dabcf5b14fbc0d6b8561b3c1f22933fd4c035c141711fb61b38b5 +size 199058722 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7e7017e3eed86ffe36e3ab2994f3a95517070372 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:964c2fcdcc6b16c9eb2ad4db5850e877b290231d02f3e13e04458c7151a58eea +size 199058647 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..582b5be370a9886f15abb2786d68e805f425969c --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd849f17790eb548385dfce5a13a3eda3148743cb8188640bbbf9ee040435af7 +size 199058647 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7a069bd6917a4426c9f7286434a6d05541b11a0e --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9a145665821e60b6493b52443fc063f267ac1aefe0817115ace908b4f9d1c75 +size 199058658 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2fa941db437239c77559118280ae60b852760879 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a56e20238343ca5b0485ed6cf432ae15586e7716f2fe0f9a0d6f8e620560f0fe +size 199058658 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..59850924d1d90e7794701437f2aa5cb5fef0046f --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e467050251056d29169b1ea192eda5644a944d900c63c8a0b52d2cc6990b0e1e +size 199058722 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..521bc896e98821ef11ee241021b7f02b86bd4643 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:991317b1ebfe41818d928a781cd33d44f06a1ec35b8e89a716a07c9bfecfee07 +size 199058722 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..33002351aae86a42b0510c4a6cda757d8d38809f --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7996d874a788f9efe8c8430080fe6c899df019893f132bee825d9bed4f8e12dc +size 199058786 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c1dd6faa474b717bbc5ffe07f993a8715044cf99 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f6ed206ea6c512e71536003632555a7a205995d5e1d3d2d88aa79290192569e +size 199058786 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..947d58da5ab05012b51499cc9eab7301ad4c8cbc --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8846d3c10ad89d4226ed25c59445d047ec18cf8c3ac89fa3201e17e91de001f +size 199058722 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8e6cff5cdf2c69eb9bde85dc935aa105cf3d8be7 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5754db14310e8c710d48ff008b755eb9a2c88ae1b7bd0b0cb48684318f6c9417 +size 199058722 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6e25ed6fe8c6b6d81fd013ec1e1c687dee16a538 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:52b45938964b62da72e01d271479d552a58b157b791bcba91b3cc817fb67bf1e +size 199058786 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a7bfd94c670e2f91ebeddca430ce7f1c328de7c5 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:678481791d2b2ce8f49a88d98b135c059ddb2ae70832afcf82929dbe6721908f +size 199058786 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1ede2e904c9e9a4204b8e98cf888fb4711c23a70 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a41137efa667e1af26566ad1dd4052193481fd6dc6ab21a042dfdd3d8235bc73 +size 199058658 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..05dc11de9209da9156d04852ca1320c9af614aa2 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f3c761603976ed77891ca36d3bba47b51928af94799652f01f9ac4baf5203ed +size 199058658 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f3a5c48265e0019250682316a8e9d40f3b6ee01e --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ddcdeef5c400a5952d7e6e6f1b82f9eb1a7b35a7a70c46e409178d35f585b04f +size 199058786 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d03808fa2eb19d2cb2885e5edc4f403d452a6753 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bece7f4c821cb7fa286b5c9a49714d1ae3252eb9a1bf0d4108a12d44a11ce7e7 +size 199058786 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c0b20f35d0d07221e5c84ee166aba56bcce8713a --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f5b447ef7a028a11fb99c3920e98e0890b85351cd1f7d7bd5895f4bae0f1496 +size 199058658 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..499bc5c9374f8967551f9a254c284cd5febdda43 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d54d6ddc9d167369ede44a35ffe6a729a56ec0c548b96b68fc0ee81b753b8ff +size 199058658 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5bb5abd7b64581e33ec54e821e4d2e4f811dba20 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23b948782c5725c93a4dc098dc8999ac31af27ce6894d2916b68043a0dc5f7df +size 199058786 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..37392f8ea81df5481d8dd4ce7a24dfbb9758664b --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:13ee58047af840dfd92d7be3c57875746a6118b724e52685aba71eff8c1b826c +size 199058786 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6ae07ca443f75f338e1d7618e78b47663e5a7399 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e66667fb9ff5324deefc5372303ae9679dceb65ff1ed21489a7839f38fc898d +size 199058786 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1bea2dd666d24f591c54c9d339f2ed936da443cb --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c5cd7439db176c52769f51ea2ca47e4ebfe38f7c4f7b56f4f0237473df5db20d +size 199058786 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..71550e47164e44dcf4209e3df0d8259c3a9dd9e6 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:042305f5d907743490265e7c643d08f68d602997664b7a5e7a0eb4847b70bd67 +size 199058647 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f40931766ea00f82f7f016833c19e0e8eef5e11e --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dbc541a56815546a7f69ce3e074b11ce4acba41cf6d41dc4fae8d70029302041 +size 199058647 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fd97276dfd8edad4d1ce188c1ad5e425c588992c --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e5d2c1382d0a1b551cbd35e67aac1cae648ea268e807f7248d5073d781e4ea7f +size 199058722 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c6fc38b8c4e5675c99b645e43c69adba1c0c8640 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d1a5ef4421b829961e0494431722354880c7b315419fdac50c07f1b09aa6de2f +size 199058722 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..93ae8240645caace7d2eee16d4344967d7ab5b0a --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6abcf6c285e070944d985cfca4919943afe65e18c1994f1603782f1bafd56b8c +size 199058722 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e89b68ef440b1510ab723f23682fa975302fe26e --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:adf770163c631431ae18d203e8762a604df6edae165e7247db2709d63f047d34 +size 199058722 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..97894f965130495ba80ad7bee5d556e0b73efd4b --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b89e744758887f9219cfea418640d9937e4dbb88f8e3c7a7e456fe52387595d3 +size 199058658 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..94988207f8e327f0185ac8d6be6c9b0ee75de39f --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c482e9e80debcf9c5d1289a66263e96eb891488692e183e1b7e690e5f6e4b497 +size 199058658 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ebaeb5e96aea375368c1ccd37577b050aa457b99 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f049e3b4669a8e3b2ee5907208b0b0a9ab4da3aa54cb1f3802bb19e2871629a4 +size 199058786 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5acc1f703eac1c3607b7c254b87d5b9635a8e9c5 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8dbbb19b3aad3113ea95e22aa049b988f9f6b18c63cf61c040f5c125ed30d2f6 +size 199058786 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c200040f2bf654f7474ea80d06b6317bf0d044a5 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf708401d86f0b6ccb453d4b70fb7e017e1c77b7af5bb64a9a384980b4149f62 +size 199058658 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6286a0172e6f8f25fe7c15695344a6dde56613d8 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:656a282cd75162dcbe86da5929c5fcd968814eca945dcb0676b216419e53238d +size 199058658 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..98c20a7b56f7c18ccea7df63a82ccc5357167dc3 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a6da82fa409ec82d38edf6489579f31df416f3e03ac6b8fa75da78cd8d585fa +size 199058786 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8a4872212fd30db6e45850c800eb1f498eba79ea --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d8ad5497f3ca55fef946babb6e247da9e8ef347e6a2478bd6dfb7fdac7e8a29 +size 199058786 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1c0b146260808e56145875904255481c400cb73d --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b19747268433007dddc9045976a96f79ecf7cd26b5d6bf14ccb3fc01467c56b +size 199058786 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..20949674d359681acad8846b167f51dd5ea17283 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da350830f21fabf9d7066997ea4eba1c8a021d7defad41db29157215ef84e952 +size 199058786 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0807789f8cb16654ef7d2a335460690ffa840779 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d48e0c8fbdbcc44fceace37efb3e060e129c83ac2e2827f9c807d79bdd20c5c1 +size 199058722 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..49d8b2a63ec6b0f7d777187c349080ba69d403a0 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af6d6d7161f0b0e912eea3f414a9e777842572f76b248f03679efccbd1de2819 +size 199058722 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c0cc0ed714f607bda9cd1946a4b61d7f62313e6b --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:33005f700ce1680296db2e6887def65aa6cf01f6db76a5117880a354712f27c4 +size 199058658 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6b0df7409c56221fff4436d0e845f4c4504f5e5a --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7493eb1327b5a16e2f328fb75298c8271e332aab24d3d4baaa22fe7d26bd4db +size 199058658 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..93e476316e4053721995f38ee9adb79e15ef2aa5 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:198112366d6818ceec7e7638fee793546296fbc8f0e9123f9eda5830e600519b +size 199058658 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1306c43d3092c2e17d0e302267420d8d7c42f77c --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1e899b408309a4af8adbbf37a83be01193f909564a0cd2605442a3182d99b30 +size 199058658 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d47f688abcd92035668a0efd3cb1d459b78b6d7d --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9081a36d3292eeddd587a16504bc0d71773e19fba24b2eeb6c28a74337fa82de +size 199058647 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..40476142621e5c7fb9169e2ac9aa1595e21788d9 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1fa4e302737711e5b742d642c4faa28e509e8b54a0539efdd24b4a918088ba70 +size 199058647 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..95b15ff4f2f6133c695bc989950c1765444e5391 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e0f7b6cbc8e64d16119005cb6b0ed2621d821422e3dd4df1c5f8418a02a2be9 +size 199058850 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8069261d72774f85f68cdf5abc09c2536c11091a --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:88ccceec3fbcdf07b62c27daab8a3feb97028c016b090dc062ff7207ee180aa1 +size 199058850 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b05dd38546668bea531f868ee893f6d5d47363db --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:725c386de551e0629619e5b580faa01286723f20a80faaf0aee92588cd65f819 +size 199058722 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..75d7bb97758693b37696267ef95a507fe7078255 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:abe180e2fc4a99bcfb51d31a84c8c936d573baf28dc7679238b4c9e507f179b7 +size 199058722 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1f336578d8bc495ceeb221192354035d3e9cedfc --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c21aef273fb448394b6267fe5ed9e01eb356384aa6f936f79e2d1accc41225e +size 199058658 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..396b47f126009d244df39c455c2d9da5d3767113 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6cfd64e8b9a54d0b2e972d8795f418c198260aeb0c78be389092aa4e0662d1e0 +size 199058658 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..45220366fd083184b178f3db9fb9006690770ca1 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fbb6b06e54dcdeb4caa5bc1b470a40a5710ac65e7359728320255edc2e4a6657 +size 199058786 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..40a5bfaa7b470ae879c2c3530dc1a3302c5f285f --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c7da91299680e1bf67cc2e7369afbe848a4559cc7b106fa55d161fdf5ef4d01 +size 199058786 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0611b03268a78ab65c5b6aa4f52c024ccb332e9b --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cbb6b459742b9501efaf72ab86efa201bd751b0d9d03c06751c5aff866fd0c2f +size 199058722 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..364793619edc4ce0fa70a0466c85913426839958 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:660bd71445f36a7387bbbf623727fdb6091d67f780cf4e133956add8c3ac578e +size 199058722 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b5f9904c3c37385c881ac1b91b3218d80301260a --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a4287e77eb57efbbdd2663b5f3e669f4b5259647125f2120a104b8759961ff4c +size 199058722 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fbf27fb1171e99c8566437d0d27078b3e5f2fbe5 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b1990bdfc01b71373cd8b61d89dedbdfbad5fcac8ca71d27ae982eb750f759e +size 199058722 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..358836dd1a43d9f144748a970a5946fbf123f07f --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d91f0ff964b395173303384f196e10110350d9da330104da1eaa25556ab9d694 +size 199058722 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d7759e8a11e1150a8c2091fe34b8ebc17e18c88f --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f6008b67afa6c6b43b93ba0dbe0c5e766b4e2aa1aaea8747cd3535f25a60f79 +size 199058722 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..04b58b1ad98373d659b8f9fee903d99f2a66f3e1 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:47e8aa44b7e2d41b65be3404d00cb74d411367f9c11da61c09ce79d5edb18876 +size 199058786 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1741d0b7594d3b124c3def9a423a3fe065c3f824 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b57cc97e3921c76c694f7e6cdc7bca3ea9c5cf68b17f934fbb515f2b3837323d +size 199058786 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cf105fb7b1f08339120910f8f50b4bea4da0b483 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac180436518ee685eaa3b7c53844c5a3e64dccfbe4852b98f296f0b763124899 +size 199058658 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5a73f5789af051075ee996d52bb1b155504cfa2a --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6614b711118b4d1c7fa63385bfbcc5adeaee0aefcc4f2974104fc33f8e3d624b +size 199058658 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6c343543684a549fba37dd1ca482312c17d6984d --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77fa426563ea7b774d0474ae4a3ae4a3a20707a03912919493dcad1cc6c4ac21 +size 199058658 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..165ea635d8b85812bfc8ca0bb8affdc9337c6838 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8eed85a92987f2d7b5d2bda47b19d56151d40c039b8c0aaabaca8b47e54fc00c +size 199058658 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..545c155ef8f28918cd7307c487265fd7e26d5c08 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e556b0c997cd0d857553c34e24bd7072a9d5061c38850768ea455c4d93da0561 +size 199058839 diff --git a/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9b7dcbd66a06cdcd8a35a8ff112d400b74f93987 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:43e6b1f0472a4c2e1955fa95b634bd881c4f52ed1d47522d92abb25ab2b729c4 +size 199058839 diff --git a/4b284b21bc4seed1/global_step80108/layer_01-model_00-model_states.pt b/4b284b21bc4seed1/global_step80108/layer_01-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4a5f698ddabe0cd409a5fdb04896da160b2454a4 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/layer_01-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9bce4ef9d7d8d69603f97ee8f6ab4e8833617adcf0e859352caa586dec3c6ed +size 167511299 diff --git a/4b284b21bc4seed1/global_step80108/layer_01-model_01-model_states.pt b/4b284b21bc4seed1/global_step80108/layer_01-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..13f9eaf5be55cb46b3acbe023b8b7cbe20db5195 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/layer_01-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0111012ce4a59be21f4c3866f971d069cd9d66f183844c519c8d261ff793a7c +size 167511299 diff --git a/4b284b21bc4seed1/global_step80108/layer_03-model_00-model_states.pt b/4b284b21bc4seed1/global_step80108/layer_03-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..031afaef5dc0f40dcd6b08db4f9e44cb4ffd82c9 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/layer_03-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7c905a569a5221aba7618b4933bf4178672d2cb7bfabe1c2085c210ae131572 +size 113308931 diff --git a/4b284b21bc4seed1/global_step80108/layer_03-model_01-model_states.pt b/4b284b21bc4seed1/global_step80108/layer_03-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5016ad1e54f6a4231475e09c38d02ef8a670bed9 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/layer_03-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b0a181461b42535f0793d140cec53e92c8e9dc3af884fa6fa2b44a16764b31eb +size 113308931 diff --git a/4b284b21bc4seed1/global_step80108/layer_04-model_00-model_states.pt b/4b284b21bc4seed1/global_step80108/layer_04-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..186883f0ff994703f485f1ae41b8a015d8f026ea --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/layer_04-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6322d081e42f379ee9ebb7b5af89d7c0edd10a9f245e1ab78e6774c37973779 +size 113308931 diff --git a/4b284b21bc4seed1/global_step80108/layer_04-model_01-model_states.pt b/4b284b21bc4seed1/global_step80108/layer_04-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..66ba29f5f9819701720f79fbbcc92cad71e26f94 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/layer_04-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fad85058781b5f7c42fffbf1fe6ad54d8c2d097eceb011c68fc560ac2207fb53 +size 113308931 diff --git a/4b284b21bc4seed1/global_step80108/layer_05-model_00-model_states.pt b/4b284b21bc4seed1/global_step80108/layer_05-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1027bedce3f7eacc1e5910768221ac9d5951382c --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/layer_05-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ccc06fa5711319a0b4c74d8bd95cde46c530774ac1d77cf19e4c78d4255dd76 +size 113308931 diff --git a/4b284b21bc4seed1/global_step80108/layer_05-model_01-model_states.pt b/4b284b21bc4seed1/global_step80108/layer_05-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bb9acf8afc020d930d228f6bff94bda98ab35ac7 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/layer_05-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b1107fed20d2cff9fe3ee1b7b975b9d4e8e704b0ff4ed16951c135ec83fd114 +size 113308931 diff --git a/4b284b21bc4seed1/global_step80108/layer_06-model_00-model_states.pt b/4b284b21bc4seed1/global_step80108/layer_06-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8d550b3746a444287f0e41dcdb395ea6a5d501c7 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/layer_06-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5920bb26f9a7489269617d4a9c3956b527b8e7f03fc00fe95d9eeb17ea7fc4ed +size 113308931 diff --git a/4b284b21bc4seed1/global_step80108/layer_06-model_01-model_states.pt b/4b284b21bc4seed1/global_step80108/layer_06-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ba7c82392da1d283092164983829adede2140ddb --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/layer_06-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c3abcc51b69600b245f9bcc1b94094d48546792d96e89cdca6623b1d2751e8f +size 113308931 diff --git a/4b284b21bc4seed1/global_step80108/layer_07-model_00-model_states.pt b/4b284b21bc4seed1/global_step80108/layer_07-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8a1bd2941c5747e0616c48fdd655055cc818910e --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/layer_07-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:481eef8513c548ecc89a8f13ef5b59b8295a4ffd51b28fb7966ded7fa813e6ac +size 113308931 diff --git a/4b284b21bc4seed1/global_step80108/layer_07-model_01-model_states.pt b/4b284b21bc4seed1/global_step80108/layer_07-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cc89312eb8b3744ddad564c9d59e0477ce343750 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/layer_07-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:17b55374ecb8c1e53685768911c4468a61c22bbc8d04df9b680364f6d6ff4ad4 +size 113308931 diff --git a/4b284b21bc4seed1/global_step80108/layer_08-model_00-model_states.pt b/4b284b21bc4seed1/global_step80108/layer_08-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dff9178b4c55e3a44877e0de098c4697665c6f8d --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/layer_08-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6bad9d911af3f37227e6af5e9b7b49bc0b0051355182b336b3077f042beb9dbc +size 113308931 diff --git a/4b284b21bc4seed1/global_step80108/layer_08-model_01-model_states.pt b/4b284b21bc4seed1/global_step80108/layer_08-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c8f2f32271e2e7953f4bacfa573df636df65f3e8 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/layer_08-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c28ba1acbc074023f35f7869cf6187209dc26484e4c191806595ab5449938297 +size 113308931 diff --git a/4b284b21bc4seed1/global_step80108/layer_09-model_00-model_states.pt b/4b284b21bc4seed1/global_step80108/layer_09-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e6e50a714151540f3c1614fb473ad0fd023e8112 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/layer_09-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6134f64584307bf8e2c867fcdff1c88445d212724ca48254f34657bba3505149 +size 113308931 diff --git a/4b284b21bc4seed1/global_step80108/layer_09-model_01-model_states.pt b/4b284b21bc4seed1/global_step80108/layer_09-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..39fb8012c8552885be757035bc1c04672c2a65fa --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/layer_09-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd4542388bf0c70ea107104bcc7dda58f34829bfac4da917d2d423cd722f4a89 +size 113308931 diff --git a/4b284b21bc4seed1/global_step80108/layer_10-model_00-model_states.pt b/4b284b21bc4seed1/global_step80108/layer_10-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e637d112aa758c64533cfcea6ae78dd4bf1f0bee --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/layer_10-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c653f79addbf86502fe0d94d47232b5daaad9fd7f4dc2eb41a5e8bd0ed273fbe +size 113308931 diff --git a/4b284b21bc4seed1/global_step80108/layer_10-model_01-model_states.pt b/4b284b21bc4seed1/global_step80108/layer_10-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fdd0a841a9e7e4844281c91b7ae5418e99bfb432 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/layer_10-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a4b10cf2b5571b1937d324a3058dc7c720574886a46affc186df7b0a7ece48dd +size 113308931 diff --git a/4b284b21bc4seed1/global_step80108/layer_11-model_00-model_states.pt b/4b284b21bc4seed1/global_step80108/layer_11-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1a8b3fc7e0ff78ebd21a7b3401ba3c4b3cfc0ec9 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/layer_11-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c731b4d95fbe2de9a5a1a44b56a3b8cefdd4ae4469a8ed24fa4df1a02d310d44 +size 113308931 diff --git a/4b284b21bc4seed1/global_step80108/layer_11-model_01-model_states.pt b/4b284b21bc4seed1/global_step80108/layer_11-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dd9804b6d3980056960f553e9a321d9d486e2400 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/layer_11-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:502a0f37bb64dc051859ef524bdd350c81bdeb7817096c249a30eb0d1fc6ba78 +size 113308931 diff --git a/4b284b21bc4seed1/global_step80108/layer_12-model_00-model_states.pt b/4b284b21bc4seed1/global_step80108/layer_12-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bd2f0a65dcbb46ec0a2629e7326935e96569e9e2 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/layer_12-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7467668750d77e3d4882bf902c211b3e427aaf23a323168c7bc0e368ab7683e6 +size 113308931 diff --git a/4b284b21bc4seed1/global_step80108/layer_12-model_01-model_states.pt b/4b284b21bc4seed1/global_step80108/layer_12-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..db03aabe2a631fd3fa8daf78216e2104b9cd2873 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/layer_12-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cda00c43d4d0143b1fbcc0f4b00387515e70fa811f56f062112efcbc8d3ff20e +size 113308931 diff --git a/4b284b21bc4seed1/global_step80108/layer_13-model_00-model_states.pt b/4b284b21bc4seed1/global_step80108/layer_13-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..031d2b715672790d98ad953adfadf83283377388 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/layer_13-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:722cd18aaa40434b6a1a7967911da69b8916f36a8a6cfe66e7cf7bf61da5692c +size 113308931 diff --git a/4b284b21bc4seed1/global_step80108/layer_13-model_01-model_states.pt b/4b284b21bc4seed1/global_step80108/layer_13-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ebd3d86844a93987230a68a1dc54eb68788f1c16 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/layer_13-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0fbd5733031b72a41e5a613f7be9305b68abec6652f88d51147bb06c7366d1db +size 113308931 diff --git a/4b284b21bc4seed1/global_step80108/layer_14-model_00-model_states.pt b/4b284b21bc4seed1/global_step80108/layer_14-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..aefacd7b5cca2a0cbc2cf087fd7a0939f720b1fd --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/layer_14-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77fdfb5229828fa507c9097ba88a2b4eca5707a459549c821dcc786eb79c790d +size 113308931 diff --git a/4b284b21bc4seed1/global_step80108/layer_14-model_01-model_states.pt b/4b284b21bc4seed1/global_step80108/layer_14-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..243a6e7dd8776a6b02b03e9c108dda94ba6e1ea3 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/layer_14-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:458cf752d7166d8f6a107954b4d51be1ff0eecd0e60bac00491dae00001b2983 +size 113308931 diff --git a/4b284b21bc4seed1/global_step80108/layer_15-model_00-model_states.pt b/4b284b21bc4seed1/global_step80108/layer_15-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7d7a0530ce81e0d0d222e879a2976b5ba804f3d4 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/layer_15-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d7164f9e844fb75fe9c4158470f2c7dfb9d3508a883a2b14d2b67cf1f684ce71 +size 113308931 diff --git a/4b284b21bc4seed1/global_step80108/layer_15-model_01-model_states.pt b/4b284b21bc4seed1/global_step80108/layer_15-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2f3f407c4b6a74b30e5bf69a7a2c9896aa9c0c7d --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/layer_15-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ba0f913227453bc73d066b352f832d8872012ae12e9ab8fd42c977dd92a3dae +size 113308931 diff --git a/4b284b21bc4seed1/global_step80108/layer_16-model_00-model_states.pt b/4b284b21bc4seed1/global_step80108/layer_16-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fc380b7a679ac0fc0cd426bae730530139fa98ed --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/layer_16-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:52566c699e45733d3a3271b5aa345341d345c6b5deb1f701a537154dbabeef7f +size 113308931 diff --git a/4b284b21bc4seed1/global_step80108/layer_16-model_01-model_states.pt b/4b284b21bc4seed1/global_step80108/layer_16-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3f2ab48da59c43b4e852e926870bb3d1341cf2e5 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/layer_16-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad45baad281e579dd56652bd627626ef31bb010520b8ff2bd5b871e6e63cc420 +size 113308931 diff --git a/4b284b21bc4seed1/global_step80108/layer_17-model_00-model_states.pt b/4b284b21bc4seed1/global_step80108/layer_17-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..70f1ce16ae339594351f48d296b2d144e4c4a489 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/layer_17-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6278445f46875cce2c0ccd2bc00fef96d3fadd9a43ba12faaa5daa55309cd27c +size 113308931 diff --git a/4b284b21bc4seed1/global_step80108/layer_17-model_01-model_states.pt b/4b284b21bc4seed1/global_step80108/layer_17-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..02dc6386ff2b5904e93fcbaa422aaf1696e741eb --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/layer_17-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bfc8fb2e5c74b68cf353131bc21b8331279724d70a6218b1536b697d4d40adba +size 113308931 diff --git a/4b284b21bc4seed1/global_step80108/layer_18-model_00-model_states.pt b/4b284b21bc4seed1/global_step80108/layer_18-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4432792569590cdadd85ed02fd9069140ee31575 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/layer_18-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2593c09bf7f5d3b3d780b38d893e26aec3b5818b2852e55fcf2670e597523245 +size 113308931 diff --git a/4b284b21bc4seed1/global_step80108/layer_18-model_01-model_states.pt b/4b284b21bc4seed1/global_step80108/layer_18-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..09d35e01bf0a5a8c4763facc1992f9859844fdd7 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/layer_18-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a1b08d7aca8c3055b53aed41f799e2df4899837cd7cdc5ca51cce99549563fa +size 113308931 diff --git a/4b284b21bc4seed1/global_step80108/layer_19-model_00-model_states.pt b/4b284b21bc4seed1/global_step80108/layer_19-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..acbb1f0784969f26df407f6fd42e74138baedeca --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/layer_19-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c546adce60bcccb3d9d44d74840fc418b850cddcd5354601bb7d3bab550ed517 +size 113308931 diff --git a/4b284b21bc4seed1/global_step80108/layer_19-model_01-model_states.pt b/4b284b21bc4seed1/global_step80108/layer_19-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..da6942ca310c617b8c4b3452d228981fa15b957b --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/layer_19-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:857e7d8af09d8c6fb428209c62275005dfe7493b3a236aeaf47b71aba1c883c7 +size 113308931 diff --git a/4b284b21bc4seed1/global_step80108/layer_20-model_00-model_states.pt b/4b284b21bc4seed1/global_step80108/layer_20-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..04b06f40617add7b7cd14ea9d16105baa641ca13 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/layer_20-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3374f355e46ab1246e61095070cb9d1843d3e4f4430daf075feb5dcda83653e1 +size 113308931 diff --git a/4b284b21bc4seed1/global_step80108/layer_20-model_01-model_states.pt b/4b284b21bc4seed1/global_step80108/layer_20-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..290338ebf5ce90560439192afc3496bbecfb068c --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/layer_20-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:715fc85b1b6ec3560f9824d3c2f0aa7345cf95aabaa652d3c7ac10debc37da03 +size 113308931 diff --git a/4b284b21bc4seed1/global_step80108/layer_21-model_00-model_states.pt b/4b284b21bc4seed1/global_step80108/layer_21-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e647f7da802012fd8bfb88727b6604ed1374e8f7 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/layer_21-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:87c6831b67ece9bab4367d8b8beea7bae7d52f60dd9975dd353a88ebe1ef7830 +size 113308931 diff --git a/4b284b21bc4seed1/global_step80108/layer_21-model_01-model_states.pt b/4b284b21bc4seed1/global_step80108/layer_21-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fa65afad8a8a3881e4519e736c6c960506a5f265 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/layer_21-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f35c28acc23bc18cd4439691d14a79ce643b9021f1e35c43202f67044394e40 +size 113308931 diff --git a/4b284b21bc4seed1/global_step80108/layer_22-model_00-model_states.pt b/4b284b21bc4seed1/global_step80108/layer_22-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dab12d5d532146afa2df715c3eff258178005034 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/layer_22-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af9ba3254cc51ee6f178bee08f9057c5d5a6816a339010d932614138a5835209 +size 113308931 diff --git a/4b284b21bc4seed1/global_step80108/layer_22-model_01-model_states.pt b/4b284b21bc4seed1/global_step80108/layer_22-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f13a9d1af2e3dfb5b6594b8ded104b1dfafa32ba --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/layer_22-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5aa038f2b9c96317bf83ebcc617ffb9312ebd5ee49ad5f77506f9a088c4041ff +size 113308931 diff --git a/4b284b21bc4seed1/global_step80108/layer_23-model_00-model_states.pt b/4b284b21bc4seed1/global_step80108/layer_23-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..816671d1b6858e7c9c56e8d6ff3115cbe5d8baeb --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/layer_23-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:83b04acaa988163dfb3eccf5b557366296afafe3f56aa7410ba68c6218fcf8fc +size 113308931 diff --git a/4b284b21bc4seed1/global_step80108/layer_23-model_01-model_states.pt b/4b284b21bc4seed1/global_step80108/layer_23-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bef92860e4ecc48fb7c5d2b33965ef7023df6999 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/layer_23-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:19bcf0098306e60b5893273718169e1e7d18cad9e154546fad2b6d3217912cb1 +size 113308931 diff --git a/4b284b21bc4seed1/global_step80108/layer_24-model_00-model_states.pt b/4b284b21bc4seed1/global_step80108/layer_24-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..17a4a871058e69b84351db59db41dd39751a6daa --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/layer_24-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4aec58bce5352b5d0a176167af51c3cbad92dc23bc30da89ba947b60ea5257f2 +size 113308931 diff --git a/4b284b21bc4seed1/global_step80108/layer_24-model_01-model_states.pt b/4b284b21bc4seed1/global_step80108/layer_24-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8f1d80f96eb8593fb569125e872735f481299dc0 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/layer_24-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:67f8b69ee1c6bdc773a977a5e6e21e07023a18d6d0e60b52c2dc3022ced14357 +size 113308931 diff --git a/4b284b21bc4seed1/global_step80108/layer_25-model_00-model_states.pt b/4b284b21bc4seed1/global_step80108/layer_25-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9115564150722ee64bf7c43c7a6560b4e0818b2a --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/layer_25-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fff8b2eda78d328baa4fc6fae4f9da52f190b3ab63ae1cbd00bb80f7ebaafe12 +size 113308931 diff --git a/4b284b21bc4seed1/global_step80108/layer_25-model_01-model_states.pt b/4b284b21bc4seed1/global_step80108/layer_25-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cf745d553ba04be71da7c0b25dbaf2ca57a931c0 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/layer_25-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a02327c127c56528597a8c40467bbca4819bcd0da07f55be7bc405dd567de89b +size 113308931 diff --git a/4b284b21bc4seed1/global_step80108/layer_26-model_00-model_states.pt b/4b284b21bc4seed1/global_step80108/layer_26-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..418113569b9d8d40432dd534321dbabed4f325c6 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/layer_26-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:afdd6e1d3e9958f3da5f6adab90023f983ed68f90bc6ac2f395d27b60e5b488e +size 113308931 diff --git a/4b284b21bc4seed1/global_step80108/layer_26-model_01-model_states.pt b/4b284b21bc4seed1/global_step80108/layer_26-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3d01ab692489c3c88ecbadb358b9337deb3478f0 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/layer_26-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7844939c64fb146ab4bcddb3c304bf3d6e558b003ba276bc4a16f042c0b0c506 +size 113308931 diff --git a/4b284b21bc4seed1/global_step80108/layer_27-model_00-model_states.pt b/4b284b21bc4seed1/global_step80108/layer_27-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..31ceabc9c70cc5e9c0a2de455da59b12c6b896c7 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/layer_27-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8dd7a853ee63b0573247fd26287fe0cecd8867b7230755cc9ae95dca222ea83c +size 113308931 diff --git a/4b284b21bc4seed1/global_step80108/layer_27-model_01-model_states.pt b/4b284b21bc4seed1/global_step80108/layer_27-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..da83450611393ae0f7e4e8e664a34bebc008e271 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/layer_27-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9587197bd222c23e4c0856430ab641d8cce8cfda232de64326f96f3eb3de3102 +size 113308931 diff --git a/4b284b21bc4seed1/global_step80108/layer_28-model_00-model_states.pt b/4b284b21bc4seed1/global_step80108/layer_28-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2897cd772ec0119f2e30395eef9f465488e31c82 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/layer_28-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:45964d85896af38cbf59055c4ba9a73a7d36b489daf49e64c6223165827019fc +size 113308931 diff --git a/4b284b21bc4seed1/global_step80108/layer_28-model_01-model_states.pt b/4b284b21bc4seed1/global_step80108/layer_28-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dcf263013698b7b984aba8f4be9532016a0020a1 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/layer_28-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:26162b400dae36de9b0e70f02ccdfba192789c2efebec9a388db88d857ce2192 +size 113308931 diff --git a/4b284b21bc4seed1/global_step80108/layer_29-model_00-model_states.pt b/4b284b21bc4seed1/global_step80108/layer_29-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a07718d3f3de000575c6a93d50cde5bffe8b25d0 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/layer_29-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:973ad75900ce950ed12c91a99a3e66ad98229e355f36a782227bbe641c1729ff +size 113308931 diff --git a/4b284b21bc4seed1/global_step80108/layer_29-model_01-model_states.pt b/4b284b21bc4seed1/global_step80108/layer_29-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c56c2b573ce9abb1d15f316371b4a77ed28bc035 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/layer_29-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2212fcdee572d7fb9b6b7ae58dedac5b2b32a60bc5965702dd055a8029d1b6a4 +size 113308931 diff --git a/4b284b21bc4seed1/global_step80108/layer_30-model_00-model_states.pt b/4b284b21bc4seed1/global_step80108/layer_30-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b0a5943d82987b3715a1fdba08177d7d9550ee45 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/layer_30-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:85c38ccf72de3c2dbdd6fd7eac084a95ad5cd12e9ebb3197fbbd4eeb57acbce2 +size 113308931 diff --git a/4b284b21bc4seed1/global_step80108/layer_30-model_01-model_states.pt b/4b284b21bc4seed1/global_step80108/layer_30-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d6563fc9d416de9a19db55811d09ee8dc9c64e67 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/layer_30-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a23bb91ddb52dd83748e40d245c60e869e7234b950b9d980cf8b38a5365d1775 +size 113308931 diff --git a/4b284b21bc4seed1/global_step80108/layer_31-model_00-model_states.pt b/4b284b21bc4seed1/global_step80108/layer_31-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0b0f29f9f07480cd62935fe1b69a27e592d6d6e4 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/layer_31-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b2ea3dd503e45c39f5ef99ee6f29daa831f47c502e9cd7620ad33d5cebc43db9 +size 113308931 diff --git a/4b284b21bc4seed1/global_step80108/layer_31-model_01-model_states.pt b/4b284b21bc4seed1/global_step80108/layer_31-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fadd2bd5afd11796000f4a2f6dc128c490fab4bb --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/layer_31-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f602bef3b253592e5b3496cad0186869224f51ff3803e5dbb3c7026e843b90a4 +size 113308931 diff --git a/4b284b21bc4seed1/global_step80108/layer_32-model_00-model_states.pt b/4b284b21bc4seed1/global_step80108/layer_32-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e52eed66ecb77cf263998852d2f77c2ed853cd17 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/layer_32-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e43074430118789fddec3f449f5c01013b2526587a62deb95cf9b248cf09d821 +size 113308931 diff --git a/4b284b21bc4seed1/global_step80108/layer_32-model_01-model_states.pt b/4b284b21bc4seed1/global_step80108/layer_32-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1163cfe792eaca51c871111963455e6128b03dba --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/layer_32-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eda1d868ccd99786bdce3310436a4d32fd8a22b4b653e71f124f6f50d4119a1d +size 113308931 diff --git a/4b284b21bc4seed1/global_step80108/layer_33-model_00-model_states.pt b/4b284b21bc4seed1/global_step80108/layer_33-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1bc3d08249684651d63809e2cffc34723081a172 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/layer_33-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ecfebfbbfad3c65913a0695c2faec0a3e05aea6bb6801b5a3ad97b992d05df99 +size 113308931 diff --git a/4b284b21bc4seed1/global_step80108/layer_33-model_01-model_states.pt b/4b284b21bc4seed1/global_step80108/layer_33-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1d91035c6c2d8a5a91889071db3064420262eac0 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/layer_33-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf115a4a80d42ee8dcb15eb0536b5c1cb1ca7c41bd07c3769d9fc4545ca708cf +size 113308931 diff --git a/4b284b21bc4seed1/global_step80108/layer_34-model_00-model_states.pt b/4b284b21bc4seed1/global_step80108/layer_34-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b725534fe4e2963887a2de187acbf2abbd8b3bcc --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/layer_34-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:81bc77b768807ad13b805fde56607ef5bd2d9c0b7fab9f664d16c993b9d6af21 +size 113308931 diff --git a/4b284b21bc4seed1/global_step80108/layer_34-model_01-model_states.pt b/4b284b21bc4seed1/global_step80108/layer_34-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..79290318d3f1f993f430bbb9dff53d458ad386f3 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/layer_34-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae0a0937d794e361735286e4f78b4f9511c17d7c5de87f1dd38be4104ec316c7 +size 113308931 diff --git a/4b284b21bc4seed1/global_step80108/layer_35-model_00-model_states.pt b/4b284b21bc4seed1/global_step80108/layer_35-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..473650ced30a4f6dc79149fbf067d59ce4367e83 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/layer_35-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:633c5b67b9e63df8c30a987ed14b0e07a78185e77cae3386ca929c076f2dd834 +size 113308931 diff --git a/4b284b21bc4seed1/global_step80108/layer_35-model_01-model_states.pt b/4b284b21bc4seed1/global_step80108/layer_35-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ae2842bb27797e8b8d87559557b3cc7fc99d8603 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/layer_35-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ec9867b4ec07364d901ea1467d00f786e4c1f9a2983ef72975c9a6f062f7f65 +size 113308931 diff --git a/4b284b21bc4seed1/global_step80108/layer_36-model_00-model_states.pt b/4b284b21bc4seed1/global_step80108/layer_36-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..33e543f21751c34761092bc05a177a7c015b911d --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/layer_36-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f0dfd74ccadf51acbda6949b5874ad2c756a60f8ba5ad58f7c0bc22dfd6d5e4 +size 113308931 diff --git a/4b284b21bc4seed1/global_step80108/layer_36-model_01-model_states.pt b/4b284b21bc4seed1/global_step80108/layer_36-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..44323ca315ff827f03d1f9d32e7b33edd5ffb5ec --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/layer_36-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee409dffd1e462ff49fbef0cf6d5b9bc8774fafcbe0104c2bae4550d9f1268eb +size 113308931 diff --git a/4b284b21bc4seed1/global_step80108/layer_37-model_00-model_states.pt b/4b284b21bc4seed1/global_step80108/layer_37-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e720ef46684c171171d6f490f0ca5593e1816e63 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/layer_37-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9634f0aff0ad7685b6be93a5d7e9a8842994257ae0f6097d6a9d45e5be8a4579 +size 113308931 diff --git a/4b284b21bc4seed1/global_step80108/layer_37-model_01-model_states.pt b/4b284b21bc4seed1/global_step80108/layer_37-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0a3a51ea374d19481069910e2b7339ca62689561 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/layer_37-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2586d361a98dc21cbf5676d5d03703054e4aac0b4d1e4aa749845462b4c48bc0 +size 113308931 diff --git a/4b284b21bc4seed1/global_step80108/layer_38-model_00-model_states.pt b/4b284b21bc4seed1/global_step80108/layer_38-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3c246406feebd3328a61a89a779ff04042660e7e --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/layer_38-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:49c2f4e88b60749f13998af96f1577b8686dd2e9c0b48eb214424fc1794aaf9f +size 113308931 diff --git a/4b284b21bc4seed1/global_step80108/layer_38-model_01-model_states.pt b/4b284b21bc4seed1/global_step80108/layer_38-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2a7c3307bc86f2afb5226419afaf10bf90fdedd4 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/layer_38-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:993f0dd25f4170c83869494f127115a4ba02557f696b6cb71034c7839fe47b67 +size 113308931 diff --git a/4b284b21bc4seed1/global_step80108/layer_40-model_00-model_states.pt b/4b284b21bc4seed1/global_step80108/layer_40-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9fb28dad3532f3b495ffad22ed6d7c2137421898 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/layer_40-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5416aa18180cd69e716dcdb2690e2d054873211b205b64ade14cb6b8efa089a7 +size 13507 diff --git a/4b284b21bc4seed1/global_step80108/layer_40-model_01-model_states.pt b/4b284b21bc4seed1/global_step80108/layer_40-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..97b8eee0e420da71a0a9bf2787fd8dabe0fc60c3 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/layer_40-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:44a1c7a574446afe07fb8e1556a3e8e6cb31d45cd67694a70ca92ca642f14ae8 +size 13507 diff --git a/4b284b21bc4seed1/global_step80108/mp_rank_00_model_states.pt b/4b284b21bc4seed1/global_step80108/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6fd5c173d5f2794cd90edcb80eb26d47c8226d2e --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1d6319d7044c3023dfe5ae147848eab676e846ea9c9913aeff2607a48031904 +size 51507 diff --git a/4b284b21bc4seed1/global_step80108/mp_rank_01_model_states.pt b/4b284b21bc4seed1/global_step80108/mp_rank_01_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..50b294bde832e9a43ed1e45ebdae58697c68dcc7 --- /dev/null +++ b/4b284b21bc4seed1/global_step80108/mp_rank_01_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6336187f61b53163ed0f34a7a086bedf9ec9b35c37b14ca74e9241da227c2bfe +size 51507 diff --git a/4b284b21bc4seed1/transformers/config.json b/4b284b21bc4seed1/transformers/config.json new file mode 100644 index 0000000000000000000000000000000000000000..df814c3a71ee49044410636b5eeb4f43611690ba --- /dev/null +++ b/4b284b21bc4seed1/transformers/config.json @@ -0,0 +1 @@ +{"vocab_size": 50432, "n_positions": 2048, "n_embd": 3072, "n_layer": 36, "n_head": 24, "n_inner": 12288, "activation_function": "gelu", "resid_pdrop": 0.1, "embd_pdrop": 0.1, "attn_pdrop": 0.1, "layer_norm_epsilon": 1e-05, "initializer_range": 0.02, "summary_type": "cls_index", "summary_use_proj": true, "summary_activation": null, "summary_first_dropout": 0.1, "summary_proj_to_labels": true, "scale_attn_weights": true, "use_cache": true, "scale_attn_by_inverse_layer_idx": false, "reorder_and_upcast_attn": false, "bos_token_id": 50256, "eos_token_id": 50256, "return_dict": true, "output_hidden_states": false, "output_attentions": false, "torchscript": false, "torch_dtype": null, "use_bfloat16": false, "tf_legacy_loss": false, "pruned_heads": {}, "tie_word_embeddings": true, "is_encoder_decoder": false, "is_decoder": false, "cross_attention_hidden_size": null, "add_cross_attention": false, "tie_encoder_decoder": false, "max_length": 20, "min_length": 0, "do_sample": false, "early_stopping": false, "num_beams": 1, "num_beam_groups": 1, "diversity_penalty": 0.0, "temperature": 1.0, "top_k": 50, "top_p": 1.0, "typical_p": 1.0, "repetition_penalty": 1.0, "length_penalty": 1.0, "no_repeat_ngram_size": 0, "encoder_no_repeat_ngram_size": 0, "bad_words_ids": null, "num_return_sequences": 1, "chunk_size_feed_forward": 0, "output_scores": false, "return_dict_in_generate": false, "forced_bos_token_id": null, "forced_eos_token_id": null, "remove_invalid_values": false, "exponential_decay_length_penalty": null, "suppress_tokens": null, "begin_suppress_tokens": null, "architectures": ["GPT2LMHeadModel"], "finetuning_task": null, "id2label": {"0": "LABEL_0", "1": "LABEL_1"}, "label2id": {"LABEL_0": 0, "LABEL_1": 1}, "tokenizer_class": null, "prefix": null, "pad_token_id": null, "sep_token_id": null, "decoder_start_token_id": null, "task_specific_params": null, "problem_type": null, "_name_or_path": "", "transformers_version": "4.25.0.dev0", "n_ctx": 1024, "gradient_checkpointing": false, "model_type": "gpt2"} \ No newline at end of file diff --git a/4b284b21bc4seed1/transformers/pytorch_model.bin b/4b284b21bc4seed1/transformers/pytorch_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..6a1959f982cc470088ce5f3d3b818629f0623660 --- /dev/null +++ b/4b284b21bc4seed1/transformers/pytorch_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6df2f3d05f267174fe58ffbdf3398db89d32f0517af07ce72c327d93724bd9c4 +size 8781203669 diff --git a/4b284b21bc4seed3/evaluation/generation/agg.4b284b21bc4seed3_GEM-web_nlg_en_PALM_prompt_0.json b/4b284b21bc4seed3/evaluation/generation/agg.4b284b21bc4seed3_GEM-web_nlg_en_PALM_prompt_0.json new file mode 100644 index 0000000000000000000000000000000000000000..6faf19778134f274b6f7e629a433476790e71ec8 --- /dev/null +++ b/4b284b21bc4seed3/evaluation/generation/agg.4b284b21bc4seed3_GEM-web_nlg_en_PALM_prompt_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.38535441961499517, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.03552663485548509}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.07392314530016614, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0017416928662543226}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.31161026039179884, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0047814670849113125}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.11065558909994337, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0020016224462212732}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.03387963683203527, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0009418685192906572}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.15167229813850266, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.003249849487394629}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.052101576521840554, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.001254434060918415}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.07143509621818969, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0016292918867949191}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.30392322887986606, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004670559568432556}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.10721119439428567, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.001872014217214712}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.0707943641461647, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0016472302036406458}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.2986281388001843, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0045364052998747}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.10596966360979974, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.001881280054371966}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b21bc4seed3/evaluation/generation/agg.4b284b21bc4seed3_GEM-web_nlg_en_PALM_prompt_1.json b/4b284b21bc4seed3/evaluation/generation/agg.4b284b21bc4seed3_GEM-web_nlg_en_PALM_prompt_1.json new file mode 100644 index 0000000000000000000000000000000000000000..406b8160b5d3cff71db4c3bf69f556e7952a8340 --- /dev/null +++ b/4b284b21bc4seed3/evaluation/generation/agg.4b284b21bc4seed3_GEM-web_nlg_en_PALM_prompt_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.5512129467367316, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.0395418255366758}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.08196746460318716, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0014754369831595647}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.40914147014095936, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0053861796031930845}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.1276921926781691, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0018832476710271726}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.03760548245806836, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0008485772447386252}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.2004779256099399, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0039022297404803946}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.05919617667381684, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0012055006346489835}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.07759729021254366, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0013607454921227458}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.38809219654571864, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.005037385606363737}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.12093972964797003, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0017235569265706195}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.07790072285955618, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.00140465482895153}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.38623053862621287, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004945962835138011}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.12119435037639528, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.001776101552985325}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b21bc4seed3/evaluation/generation/agg.4b284b21bc4seed3_GEM-web_nlg_en_PALM_prompt_2.json b/4b284b21bc4seed3/evaluation/generation/agg.4b284b21bc4seed3_GEM-web_nlg_en_PALM_prompt_2.json new file mode 100644 index 0000000000000000000000000000000000000000..3e23ad9f85ad6e1e76f4696b210cef919751dc5d --- /dev/null +++ b/4b284b21bc4seed3/evaluation/generation/agg.4b284b21bc4seed3_GEM-web_nlg_en_PALM_prompt_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.5933018254177376, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.032599794867965604}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.08138207976281618, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.001320028581758322}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.41969083219702635, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0051938217749552314}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.12805421977747078, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0017731859601500346}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.03774533356166905, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0008138836014742545}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.21183011597903806, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0039019044052842713}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.05973961241278947, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0011408079330925724}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.07647361432812638, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.001197053850440824}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.3943345910974271, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004791104064669637}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.12034876582957013, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0016107770822709627}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.07733964505952771, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.001246953646848645}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.3972043924885929, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0047988833920575725}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.12158519620974508, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0016694470344012931}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b21bc4seed3/evaluation/generation/agg.4b284b21bc4seed3_GEM-web_nlg_en_PALM_prompt_3.json b/4b284b21bc4seed3/evaluation/generation/agg.4b284b21bc4seed3_GEM-web_nlg_en_PALM_prompt_3.json new file mode 100644 index 0000000000000000000000000000000000000000..c06f02ee8814057d20554b1c70fcf1bc0bc4590e --- /dev/null +++ b/4b284b21bc4seed3/evaluation/generation/agg.4b284b21bc4seed3_GEM-web_nlg_en_PALM_prompt_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.6676820645573561, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.029698241159243657}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.08199443734871886, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0013044083678416126}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.4326296696301956, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.005319027568329476}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.12983004472435894, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0017904512351955197}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.03836456544897309, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0008016019880007896}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.2182970907135364, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0039434390311428045}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.06110341345845585, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0011495434475286368}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.07660172161550755, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0011750201739650409}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.4026463135770865, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004800741095877209}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.12124821447948028, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0016083744034722292}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.07783198204724436, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0012330922500882204}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.40862496584299657, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004878219295388798}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.12313018758539385, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0016863121667983272}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b21bc4seed3/evaluation/generation/agg.4b284b21bc4seed3_GEM-web_nlg_en_PALM_prompt_4.json b/4b284b21bc4seed3/evaluation/generation/agg.4b284b21bc4seed3_GEM-web_nlg_en_PALM_prompt_4.json new file mode 100644 index 0000000000000000000000000000000000000000..97caef6dcb3ad015b03124fe987153cd692ec368 --- /dev/null +++ b/4b284b21bc4seed3/evaluation/generation/agg.4b284b21bc4seed3_GEM-web_nlg_en_PALM_prompt_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.6836151545167003, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.029089321693769803}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.08237641519365944, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0012712811379550952}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.4410392252234467, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.005252924753314178}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.13090538213539582, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0017570477742261594}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.038294697830682935, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0007935145188603823}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.22196349128777046, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0039874400036358035}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.061203868765094024, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.001147850507777741}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.07647361824568906, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0011522230823326422}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.40690715092516466, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0047151717706141886}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.12140909248039315, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.00158909093789567}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.07814715491035078, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0012030810779768226}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.4163700311086396, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.00483547149960936}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.12407530125753383, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0016569917198277998}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b21bc4seed3/evaluation/generation/agg.4b284b21bc4seed3_GEM-web_nlg_en_PALM_prompt_5.json b/4b284b21bc4seed3/evaluation/generation/agg.4b284b21bc4seed3_GEM-web_nlg_en_PALM_prompt_5.json new file mode 100644 index 0000000000000000000000000000000000000000..1ce9c8b5fd9aee52efc57a637a119aad04fab90f --- /dev/null +++ b/4b284b21bc4seed3/evaluation/generation/agg.4b284b21bc4seed3_GEM-web_nlg_en_PALM_prompt_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.770273022704267, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.034315297186777595}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.08203708357705593, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0012436710783140608}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.4527088578344478, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.005270512909014665}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.13101067212098677, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0017066218312728107}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.03796634902700147, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0007628000916252061}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.23182459931655927, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.004137297126449473}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.061162270106061005, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.001104511682001034}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.07531042150309193, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0011067305255883584}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.41469386205754033, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004724284504576538}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.12018039624183414, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0015114350444937687}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.07740826323217029, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0011667399100477348}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.426759509472668, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004893799458515002}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.1235732065654381, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0015991738579748697}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b21bc4seed3/evaluation/generation/agg.4b284b21bc4seed3_GEM-wiki_lingua_en_tldr_en_0.json b/4b284b21bc4seed3/evaluation/generation/agg.4b284b21bc4seed3_GEM-wiki_lingua_en_tldr_en_0.json new file mode 100644 index 0000000000000000000000000000000000000000..e7b8effe52fb07fb16c3ac35b52485dd2e260d66 --- /dev/null +++ b/4b284b21bc4seed3/evaluation/generation/agg.4b284b21bc4seed3_GEM-wiki_lingua_en_tldr_en_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.15679162263674679, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0019991369518845767}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.2689745748726192, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0029016224540331552}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.18416362480898446, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0019831229958442082}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.03467120760519669, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0008221744008462381}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.06209758141565476, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0015832249597357217}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.04094718247147155, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0009244238662338802}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.12082089693911753, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0014097474863449463}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.2144029920856489, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002350903120057298}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.14338902877501125, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0014226956074527863}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.1433977232378843, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0018222721919399013}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.24699886538862653, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0026942999677837982}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.1686525979999314, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0018124703517444088}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 1.8921440063023223, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.07135112924486753}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b21bc4seed3/evaluation/generation/agg.4b284b21bc4seed3_GEM-wiki_lingua_en_tldr_en_1.json b/4b284b21bc4seed3/evaluation/generation/agg.4b284b21bc4seed3_GEM-wiki_lingua_en_tldr_en_1.json new file mode 100644 index 0000000000000000000000000000000000000000..3ba78b56df63f8002ad0bd5e7fa14c581a735fab --- /dev/null +++ b/4b284b21bc4seed3/evaluation/generation/agg.4b284b21bc4seed3_GEM-wiki_lingua_en_tldr_en_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.18997860617259896, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0021315131916909724}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.31970644615930655, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0028665402668271315}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.22027730929537712, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0019608589609497263}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.046578501178857534, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0009806080013812627}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.08133508293170587, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0017593067161220152}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.05398367197056974, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0010308834876363582}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.1329141418602316, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0014073779291519839}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.23157078499816725, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002239708119405446}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.15563014047034032, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0013088183409122065}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.1786247909527116, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0020029209788265186}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.3014126188767162, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0027138736966177968}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.2072131798418733, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0018385432787880404}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 2.8056438776711543, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.0837473028373607}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b21bc4seed3/evaluation/generation/agg.4b284b21bc4seed3_GEM-wiki_lingua_en_tldr_en_2.json b/4b284b21bc4seed3/evaluation/generation/agg.4b284b21bc4seed3_GEM-wiki_lingua_en_tldr_en_2.json new file mode 100644 index 0000000000000000000000000000000000000000..0b6183cb38664226d7ac5e386bcdc737b2bb5097 --- /dev/null +++ b/4b284b21bc4seed3/evaluation/generation/agg.4b284b21bc4seed3_GEM-wiki_lingua_en_tldr_en_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.19848212426092088, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0023139570614517783}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.31608172323314615, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0027622954997235665}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.22219895534581124, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0019115852755068978}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.049990983654620055, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0011071845883649219}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.08099563488003071, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0017279951131225705}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.05522229843864866, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0010366643780952015}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.1388108427148649, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0016626769142365268}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.22710405861686703, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0022002521830572098}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.15589253405198344, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0012973150218916173}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.18757113799557207, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0021914037253074584}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.2994878980311641, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0026463012724863054}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.2100590256285955, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0018001298788378707}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 2.9780392590967417, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.07485005723665485}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b21bc4seed3/evaluation/generation/agg.4b284b21bc4seed3_GEM-wiki_lingua_en_tldr_en_3.json b/4b284b21bc4seed3/evaluation/generation/agg.4b284b21bc4seed3_GEM-wiki_lingua_en_tldr_en_3.json new file mode 100644 index 0000000000000000000000000000000000000000..3dc3345e702dd9ca396a6a702aada6d0a9f30a0a --- /dev/null +++ b/4b284b21bc4seed3/evaluation/generation/agg.4b284b21bc4seed3_GEM-wiki_lingua_en_tldr_en_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.17134837432784916, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.002648910653676966}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.25800000600290435, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.003313810821871368}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.18197691858961074, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002206594668965237}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.04161503586356084, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0011270454940689701}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.06562904781876294, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0016912238278118353}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.044357885260241585, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0009768044123671569}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.12351815672543218, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.002041531952456252}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.18830813752138773, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0025923821492611896}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.13010623261113158, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0015513282273767694}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.16212518594924535, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0025194852893668154}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.24439649503938565, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0031617457131678586}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.17213683153876608, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0020822081122974664}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 2.847512210211642, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.08130288880844025}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b21bc4seed3/evaluation/generation/agg.4b284b21bc4seed3_GEM-wiki_lingua_en_tldr_en_4.json b/4b284b21bc4seed3/evaluation/generation/agg.4b284b21bc4seed3_GEM-wiki_lingua_en_tldr_en_4.json new file mode 100644 index 0000000000000000000000000000000000000000..e6153752ffe5d4277cc333cee88be7c9ef415abb --- /dev/null +++ b/4b284b21bc4seed3/evaluation/generation/agg.4b284b21bc4seed3_GEM-wiki_lingua_en_tldr_en_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.05513001019844826, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.00215178654051168}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.08454226315750968, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002935250128250436}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.057107296289159025, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0019494380017288225}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.013800421209577515, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.000858478532665541}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.021959372595934164, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.001194364786706014}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.014135921586219569, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0006914493317450905}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.04128275764961394, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0016823042515051513}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.0637605084786262, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0022692310247988275}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.04216170229604133, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0014236179778487777}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.051975929888249256, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.002028731950450667}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.07986443919003557, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0027755366306270973}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.05379079735955767, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0018282128528245283}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 0.6551089372553552, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.04895444931980532}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b21bc4seed3/evaluation/generation/agg.4b284b21bc4seed3_GEM-wiki_lingua_en_tldr_en_5.json b/4b284b21bc4seed3/evaluation/generation/agg.4b284b21bc4seed3_GEM-wiki_lingua_en_tldr_en_5.json new file mode 100644 index 0000000000000000000000000000000000000000..4d7a50ba5cf6c22399cfb912fcb50479c40b0972 --- /dev/null +++ b/4b284b21bc4seed3/evaluation/generation/agg.4b284b21bc4seed3_GEM-wiki_lingua_en_tldr_en_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.009676230361373621, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0010092112696239383}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.014009287778858652, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0013693091057835286}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.009311675141314384, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0008747369590243084}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.002516778405932201, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0003813647101277748}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.004189787625575326, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0006261364681498638}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.002405387772695905, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.00030042578765582695}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.007375708880019688, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0007995038887537955}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.010624417220719972, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0010701965664864565}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.006932807281073693, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0006486704498845653}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.009118809831121096, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0009682743549182715}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.01302829985395723, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0012830127121259097}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.008662236702193958, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0008161476026799892}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 9.282109221159003e-07, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 2.2223612520502284e-06}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b21bc4seed3/evaluation/generation/agg.4b284b21bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_0.json b/4b284b21bc4seed3/evaluation/generation/agg.4b284b21bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_0.json new file mode 100644 index 0000000000000000000000000000000000000000..e0ced0af64164dc6f190cae356d6b7e5bd4fb534 --- /dev/null +++ b/4b284b21bc4seed3/evaluation/generation/agg.4b284b21bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 0.6114974539510816, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.04527113203185075}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.05869533205508546, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.001497949313805969}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.03571922348667764, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0013948024749901261}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.03492593073320387, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0010376513872745155}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.004063213985026975, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0003541545577591494}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.006573047412918524, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0005456263764429907}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.004517028931517297, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.00036439768835932237}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.05805625987920658, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0014726688390761706}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.03532952206585685, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0013716820040930184}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.03456601494605734, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0010229273732960667}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.057416666705387066, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.001471227198507916}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.033493295914568566, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0012685265746055889}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.033356146432655866, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0009612249675140079}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b21bc4seed3/evaluation/generation/agg.4b284b21bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_1.json b/4b284b21bc4seed3/evaluation/generation/agg.4b284b21bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_1.json new file mode 100644 index 0000000000000000000000000000000000000000..88b9165ecc5cb8865d6d94a104fd55f8aa20f658 --- /dev/null +++ b/4b284b21bc4seed3/evaluation/generation/agg.4b284b21bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 11.33447911090928, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.14535102796873467}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.5083802018676299, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0032791833916447554}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.42190893586204214, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002971819042737358}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.433797396683994, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0022987607409721217}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.23512517549601986, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0025920962511690763}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.19142011398550732, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0021166855984481392}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.19719568941249035, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0019377495452543357}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.37102243518103833, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.002904005844748298}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.30457624020087987, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0024007135826919603}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.31401062106699107, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0019834092080858665}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.41705381489741356, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.003122960946648587}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.34480646003082416, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0027214625950243783}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.3549188128484648, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002246841679471083}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b21bc4seed3/evaluation/generation/agg.4b284b21bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_2.json b/4b284b21bc4seed3/evaluation/generation/agg.4b284b21bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_2.json new file mode 100644 index 0000000000000000000000000000000000000000..1ee80233677a8680729369575d01d2357a3eb93d --- /dev/null +++ b/4b284b21bc4seed3/evaluation/generation/agg.4b284b21bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 12.915730606248113, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.20474125011289426}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.5479863902027133, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0032369184668208516}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.441447062617084, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0029152320911209556}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.4631809810602233, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002254496022709034}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.2694942093855683, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.002668904008037024}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.2131243378825482, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0021529009824731303}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.22387083492928028, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0019825042986668373}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.4057365701684737, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0029348734509084765}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.3240876063453124, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002423564725696539}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.34081459166299144, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.002030967494387809}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.45419008644409004, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0031526651706947012}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.3644738218767085, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0027027920241602162}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.382975161960982, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0022658855724966864}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b21bc4seed3/evaluation/generation/agg.4b284b21bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_3.json b/4b284b21bc4seed3/evaluation/generation/agg.4b284b21bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_3.json new file mode 100644 index 0000000000000000000000000000000000000000..c54665744488fb4fc8dc7ab77f74900cc695b065 --- /dev/null +++ b/4b284b21bc4seed3/evaluation/generation/agg.4b284b21bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 13.799049670661745, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.1818766642053644}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.5538154552713349, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0032031754343585057}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.4530213630135714, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002889071639596583}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.4733021068886725, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002229748270982301}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.2776711960124572, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.002669354319886314}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.22402395817155157, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0022252252780088967}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.23393615456741612, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0020284322092199397}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.4112498098162674, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.002912753431059431}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.33431398302211607, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0024572409829041286}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.34984277963163096, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0020650055785518843}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.46138958037109395, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0031283915205367083}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.37645205860452513, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0027190821967377665}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.3937728879658398, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0022887568890525446}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b21bc4seed3/evaluation/generation/agg.4b284b21bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_4.json b/4b284b21bc4seed3/evaluation/generation/agg.4b284b21bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_4.json new file mode 100644 index 0000000000000000000000000000000000000000..914c4261fe8f6cd437b21b40345927244ed45a90 --- /dev/null +++ b/4b284b21bc4seed3/evaluation/generation/agg.4b284b21bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 14.332946979780699, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.187321161876581}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.5502767036745366, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0032191855076160905}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.4601167935637563, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002933097976024252}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.47698101030399137, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002304125507421037}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.2764817164388747, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.002683961252587485}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.22893953263224417, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002301850243468405}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.23686616389681567, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0020891392412113624}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.4088077687087317, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0029284110175963112}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.34034029264854043, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002546438349753808}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.35299999087704836, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.002138766539340371}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.46022437266752997, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0031504453494794983}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.38497978756866746, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.00282067010132265}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.3988932621808988, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002365288784954707}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b21bc4seed3/evaluation/generation/agg.4b284b21bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_5.json b/4b284b21bc4seed3/evaluation/generation/agg.4b284b21bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_5.json new file mode 100644 index 0000000000000000000000000000000000000000..499246932801f857522cf5d208a9313dccd9fb4c --- /dev/null +++ b/4b284b21bc4seed3/evaluation/generation/agg.4b284b21bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 14.123246792588205, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.18981316484333496}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.5508575470527967, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.003172543361692212}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.4596250362933734, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0028838674948470076}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.4771521080848, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002247583418148515}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.27785561114819307, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0026789931891456594}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.22893900538597906, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002250810965306422}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.23757613806327457, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0020631855681245196}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.4128922710964347, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0029408076764540847}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.3432096183345724, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0025317938331892898}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.35646844538814754, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.002140481161608752}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.46456472542175714, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0031248622936883626}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.3874763961501519, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0027737834865428587}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.4021976919673297, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0023234845320029575}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b21bc4seed3/evaluation/generation/agg.4b284b21bc4seed3_gem_xsum_article_DOC_summary_0.json b/4b284b21bc4seed3/evaluation/generation/agg.4b284b21bc4seed3_gem_xsum_article_DOC_summary_0.json new file mode 100644 index 0000000000000000000000000000000000000000..a92899a45ef4345b22bbf403dddb5a66ad946553 --- /dev/null +++ b/4b284b21bc4seed3/evaluation/generation/agg.4b284b21bc4seed3_gem_xsum_article_DOC_summary_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.15967577438396582, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.002367262573167645}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.3344097957704383, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004542927765114456}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.20731019337768042, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0026329404650807355}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.03607001702892568, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.001380428573706143}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.08085696005427423, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0028599271086292063}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.04779740432400501, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0016427567157124747}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.12124210013250766, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0018353599935403793}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.25607740438919824, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0036003883952627205}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.1576331231529663, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0019951539963787477}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.1242181328811872, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0019619556407432866}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.26337373173306655, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004025744770152854}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.16181781523790845, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0022319416867268445}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 1.949120361010708, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.0913394024073436}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b21bc4seed3/evaluation/generation/agg.4b284b21bc4seed3_gem_xsum_article_DOC_summary_1.json b/4b284b21bc4seed3/evaluation/generation/agg.4b284b21bc4seed3_gem_xsum_article_DOC_summary_1.json new file mode 100644 index 0000000000000000000000000000000000000000..f96ad514baf856bee2fd7eb03a9de10df5a8b44b --- /dev/null +++ b/4b284b21bc4seed3/evaluation/generation/agg.4b284b21bc4seed3_gem_xsum_article_DOC_summary_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.12169091971501833, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0018485062787122516}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.2985653730389386, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004290053847052186}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.17081587570763854, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002498720216403539}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.02579297493046093, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0010284490730061247}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.06657394965502363, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0027184784375237805}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.03675651772088566, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0014655540573612757}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.09903048460831103, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0014377536580800821}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.24509693147391448, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.003518979975606831}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.1393113978609222, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0019655986810200457}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.09661401587871966, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0015465093492546976}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.23906516897153357, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.003723173758494015}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.13592809650365684, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0021149395154476942}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 1.3894434901616817, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.0696818577382309}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b21bc4seed3/evaluation/generation/agg.4b284b21bc4seed3_gem_xsum_article_DOC_summary_2.json b/4b284b21bc4seed3/evaluation/generation/agg.4b284b21bc4seed3_gem_xsum_article_DOC_summary_2.json new file mode 100644 index 0000000000000000000000000000000000000000..7266e169619d58dc4814e2bf36e6e48b49769566 --- /dev/null +++ b/4b284b21bc4seed3/evaluation/generation/agg.4b284b21bc4seed3_gem_xsum_article_DOC_summary_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.12932415674769882, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0018169766878992155}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.31588294560858055, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004216644148639617}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.1812341104304252, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0024420789648274964}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.02882443972103835, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0010221845705623207}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.07321267293223659, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0026752083496981217}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.04085037987286443, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0014441866865235443}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.10675121708053566, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0014369855194212536}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.26192576739698237, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.003428288975677526}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.1497403639141996, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0019366476236409818}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.10009767181496847, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0014618075217660356}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.2471962036151299, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.003570649420240086}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.1406991990555183, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0019931907678247163}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 1.519028859842843, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.10932835465017057}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b21bc4seed3/evaluation/generation/agg.4b284b21bc4seed3_gem_xsum_article_DOC_summary_3.json b/4b284b21bc4seed3/evaluation/generation/agg.4b284b21bc4seed3_gem_xsum_article_DOC_summary_3.json new file mode 100644 index 0000000000000000000000000000000000000000..0dccc470359c7838a45c0199b0e54350511dc0d3 --- /dev/null +++ b/4b284b21bc4seed3/evaluation/generation/agg.4b284b21bc4seed3_gem_xsum_article_DOC_summary_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.12669828356422383, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0020094917781438}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.2991027968300709, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004591383921824911}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.17398457366386533, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0026011912639339633}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.02846440216262034, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0010956946533866802}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.0706413058306802, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0027868384974826573}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.03976972720010616, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0015117103431558975}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.10522998362089304, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0016066968369183466}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.24989448115090335, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.003818419767894932}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.14481676263378276, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0021155906125953196}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.09817348971720044, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0016441110742716834}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.23394639249573773, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0039702384387275}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.13514679304649532, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002182435634289256}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 1.6370716620193742, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.0965616345735323}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b21bc4seed3/evaluation/generation/agg.4b284b21bc4seed3_gem_xsum_article_DOC_summary_4.json b/4b284b21bc4seed3/evaluation/generation/agg.4b284b21bc4seed3_gem_xsum_article_DOC_summary_4.json new file mode 100644 index 0000000000000000000000000000000000000000..408e9bc8817c6684b646ec7bb3227c2a035d3d91 --- /dev/null +++ b/4b284b21bc4seed3/evaluation/generation/agg.4b284b21bc4seed3_gem_xsum_article_DOC_summary_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.04259238619227563, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0027101471976600064}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.07720379689124833, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0044603739276368026}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.05007677852098019, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0028520829549217}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.01039550194215322, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0013002683205402986}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.01810305312651028, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0015721872697551358}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.011518858251746018, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.00100875710859823}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.03523709895823149, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.00227881816047799}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.06319492439650329, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0036104810452688464}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.04100139142500078, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.002305891008745547}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.03483815068281454, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0023451054837002874}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.06212330010384987, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.00366876474124129}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.040275422096666895, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0023372301427381265}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 0.8669272479971863, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.1405646989169273}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b21bc4seed3/evaluation/generation/agg.4b284b21bc4seed3_gem_xsum_article_DOC_summary_5.json b/4b284b21bc4seed3/evaluation/generation/agg.4b284b21bc4seed3_gem_xsum_article_DOC_summary_5.json new file mode 100644 index 0000000000000000000000000000000000000000..13a116466212fb5a4864f6ecbb9ec152bb64d28e --- /dev/null +++ b/4b284b21bc4seed3/evaluation/generation/agg.4b284b21bc4seed3_gem_xsum_article_DOC_summary_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.003588402424856072, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.001048591574930412}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.0028604653610329457, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0007986614088290892}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.0031002107990313337, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0008747175919556528}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.0007923025611704858, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0003921450634363378}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.0005498039696152904, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0002641981773098142}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.0006390516220219271, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.00030954190704298026}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.0027648078129268614, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0008127087627131919}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.0021867338334639443, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0006127280790696822}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.002386725038982092, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0006780512190033147}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.0030462311312536203, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0009151504800039854}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.0024328059752266973, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0006814073788898694}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.00262981517645366, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0007507411641340949}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 1.0463937563324107e-36, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 3.980151871433784e-31}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b21bc4seed3/evaluation/generation/examples.4b284b21bc4seed3_GEM-web_nlg_en_PALM_prompt_0.jsonl b/4b284b21bc4seed3/evaluation/generation/examples.4b284b21bc4seed3_GEM-web_nlg_en_PALM_prompt_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..b4dfb97a2af14bf81618f60fe50f8715a79e59ad --- /dev/null +++ b/4b284b21bc4seed3/evaluation/generation/examples.4b284b21bc4seed3_GEM-web_nlg_en_PALM_prompt_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ac93dabc8b8700a78f8a27f87336cf7cd290be3a9f654ddda49c179d9107da7 +size 4126849 diff --git a/4b284b21bc4seed3/evaluation/generation/examples.4b284b21bc4seed3_GEM-web_nlg_en_PALM_prompt_1.jsonl b/4b284b21bc4seed3/evaluation/generation/examples.4b284b21bc4seed3_GEM-web_nlg_en_PALM_prompt_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..95b5c354dd11accb8b24e1a2f7c458e0267e7351 --- /dev/null +++ b/4b284b21bc4seed3/evaluation/generation/examples.4b284b21bc4seed3_GEM-web_nlg_en_PALM_prompt_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5edcd70aa2c9bd6b44bda78763c41563980617c8a658bde5f0e89a80c754a40 +size 5112547 diff --git a/4b284b21bc4seed3/evaluation/generation/examples.4b284b21bc4seed3_GEM-web_nlg_en_PALM_prompt_2.jsonl b/4b284b21bc4seed3/evaluation/generation/examples.4b284b21bc4seed3_GEM-web_nlg_en_PALM_prompt_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..adcc56c94ba4ac18d77134a348b9c4f942f74c99 --- /dev/null +++ b/4b284b21bc4seed3/evaluation/generation/examples.4b284b21bc4seed3_GEM-web_nlg_en_PALM_prompt_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a59ed3e9dddd2c0c887c14ebee328c0d68923bf10e9452d6df9c5c949856177 +size 6023099 diff --git a/4b284b21bc4seed3/evaluation/generation/examples.4b284b21bc4seed3_GEM-web_nlg_en_PALM_prompt_3.jsonl b/4b284b21bc4seed3/evaluation/generation/examples.4b284b21bc4seed3_GEM-web_nlg_en_PALM_prompt_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..4454b2e75ac3fd017faf53d97006d4fa2a5c7087 --- /dev/null +++ b/4b284b21bc4seed3/evaluation/generation/examples.4b284b21bc4seed3_GEM-web_nlg_en_PALM_prompt_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ada2aa5e2ff15bd2a9966feac7cc5c53fa67f9d1a5d559aa2026445517c62a32 +size 6932662 diff --git a/4b284b21bc4seed3/evaluation/generation/examples.4b284b21bc4seed3_GEM-web_nlg_en_PALM_prompt_4.jsonl b/4b284b21bc4seed3/evaluation/generation/examples.4b284b21bc4seed3_GEM-web_nlg_en_PALM_prompt_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..05ae1acc585b1e57335c8a14ead9daacf20d0d74 --- /dev/null +++ b/4b284b21bc4seed3/evaluation/generation/examples.4b284b21bc4seed3_GEM-web_nlg_en_PALM_prompt_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c85fb0cc24a68668ebc69ccd9dbc6e26bed8320a9dc79c7869f8cd6a08381997 +size 7834296 diff --git a/4b284b21bc4seed3/evaluation/generation/examples.4b284b21bc4seed3_GEM-web_nlg_en_PALM_prompt_5.jsonl b/4b284b21bc4seed3/evaluation/generation/examples.4b284b21bc4seed3_GEM-web_nlg_en_PALM_prompt_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..34692fbfc5151945b752e5bf939b9fdd66214bce --- /dev/null +++ b/4b284b21bc4seed3/evaluation/generation/examples.4b284b21bc4seed3_GEM-web_nlg_en_PALM_prompt_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9087f214decdb5e9ddeae8a78c415f19513e6ab15c354560dd7e653ecd8c4efa +size 8744763 diff --git a/4b284b21bc4seed3/evaluation/generation/examples.4b284b21bc4seed3_GEM-wiki_lingua_en_tldr_en_0.jsonl b/4b284b21bc4seed3/evaluation/generation/examples.4b284b21bc4seed3_GEM-wiki_lingua_en_tldr_en_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..44edcb573770c29b14d81c0849dc7c7c6efe238b --- /dev/null +++ b/4b284b21bc4seed3/evaluation/generation/examples.4b284b21bc4seed3_GEM-wiki_lingua_en_tldr_en_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a1b5215f774cb0eb8b2a67dfc0d76fa3008ba30aeac93b571df732023103dc62 +size 7687287 diff --git a/4b284b21bc4seed3/evaluation/generation/examples.4b284b21bc4seed3_GEM-wiki_lingua_en_tldr_en_1.jsonl b/4b284b21bc4seed3/evaluation/generation/examples.4b284b21bc4seed3_GEM-wiki_lingua_en_tldr_en_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..2540e7b192cb8dfece3129da2d6ed0d0a55cb59e --- /dev/null +++ b/4b284b21bc4seed3/evaluation/generation/examples.4b284b21bc4seed3_GEM-wiki_lingua_en_tldr_en_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:608a5c8ac8b6613d5ebc4b1defbe032af31dd06126d25b0a545a04795e83b512 +size 13320296 diff --git a/4b284b21bc4seed3/evaluation/generation/examples.4b284b21bc4seed3_GEM-wiki_lingua_en_tldr_en_2.jsonl b/4b284b21bc4seed3/evaluation/generation/examples.4b284b21bc4seed3_GEM-wiki_lingua_en_tldr_en_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..323cf529ff4796f64f73f13be2d969fe82c166a5 --- /dev/null +++ b/4b284b21bc4seed3/evaluation/generation/examples.4b284b21bc4seed3_GEM-wiki_lingua_en_tldr_en_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:95a9465edcc787ed1df3c9a7c6d32f77c7024701de2d262f05a9daf3d8fb9843 +size 18906538 diff --git a/4b284b21bc4seed3/evaluation/generation/examples.4b284b21bc4seed3_GEM-wiki_lingua_en_tldr_en_3.jsonl b/4b284b21bc4seed3/evaluation/generation/examples.4b284b21bc4seed3_GEM-wiki_lingua_en_tldr_en_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..caf83acb9d1fbd3ae3fce55c7456299e51039f12 --- /dev/null +++ b/4b284b21bc4seed3/evaluation/generation/examples.4b284b21bc4seed3_GEM-wiki_lingua_en_tldr_en_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f485f8ca6ff8f030c60a00a650e80d63e5ab2f1696509a9ceb82f0f22e895a3 +size 24321747 diff --git a/4b284b21bc4seed3/evaluation/generation/examples.4b284b21bc4seed3_GEM-wiki_lingua_en_tldr_en_4.jsonl b/4b284b21bc4seed3/evaluation/generation/examples.4b284b21bc4seed3_GEM-wiki_lingua_en_tldr_en_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..4407dc3dd66529da2d996bb4f38c955117699876 --- /dev/null +++ b/4b284b21bc4seed3/evaluation/generation/examples.4b284b21bc4seed3_GEM-wiki_lingua_en_tldr_en_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b37f110e03c28c8fba2b0ee5dfae102d1197b1beb69e0f35051b6464e1601906 +size 29470431 diff --git a/4b284b21bc4seed3/evaluation/generation/examples.4b284b21bc4seed3_GEM-wiki_lingua_en_tldr_en_5.jsonl b/4b284b21bc4seed3/evaluation/generation/examples.4b284b21bc4seed3_GEM-wiki_lingua_en_tldr_en_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..68ad17aca9b223805cbda3c3f9ed6157ae380518 --- /dev/null +++ b/4b284b21bc4seed3/evaluation/generation/examples.4b284b21bc4seed3_GEM-wiki_lingua_en_tldr_en_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:031d5308bf7213bc5d1273187fe59077f25a4c93cfad2a89f2ebe92d2c25de3b +size 34798911 diff --git a/4b284b21bc4seed3/evaluation/generation/examples.4b284b21bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl b/4b284b21bc4seed3/evaluation/generation/examples.4b284b21bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..1628a97aef51e5a72c7308cd74ecfaeed447e270 --- /dev/null +++ b/4b284b21bc4seed3/evaluation/generation/examples.4b284b21bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3bf6360f5ccfefa9aa38d8b2f67c5ec2988b53982564cf3621e5d9c4962e7c71 +size 3867928 diff --git a/4b284b21bc4seed3/evaluation/generation/examples.4b284b21bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl b/4b284b21bc4seed3/evaluation/generation/examples.4b284b21bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..b76b4eb3ae8651504e287353aa94c3256e9aa0d2 --- /dev/null +++ b/4b284b21bc4seed3/evaluation/generation/examples.4b284b21bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b3b1d1e31fc1a1d13e24cf4aa0d2b3ced6a0746025f1c06e03079b3ff3ea9f3 +size 5051386 diff --git a/4b284b21bc4seed3/evaluation/generation/examples.4b284b21bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl b/4b284b21bc4seed3/evaluation/generation/examples.4b284b21bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..96c5046e0d773f1bab99a8d89a8bab05b4dc7432 --- /dev/null +++ b/4b284b21bc4seed3/evaluation/generation/examples.4b284b21bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e7dcd307671d37f211283dac747050b6c3ade7cb72108411885b9acd102b105 +size 6119353 diff --git a/4b284b21bc4seed3/evaluation/generation/examples.4b284b21bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl b/4b284b21bc4seed3/evaluation/generation/examples.4b284b21bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..844ad3a18f18cdd62a60a43e3a7dcd2ddfb8fa85 --- /dev/null +++ b/4b284b21bc4seed3/evaluation/generation/examples.4b284b21bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f5a70c37f5a7fd700e7e42c51086301cdeb336e97ea751d30ecfb5abb8101454 +size 7205539 diff --git a/4b284b21bc4seed3/evaluation/generation/examples.4b284b21bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl b/4b284b21bc4seed3/evaluation/generation/examples.4b284b21bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..04d6634f830269170c182da20a4420dfbf3bf645 --- /dev/null +++ b/4b284b21bc4seed3/evaluation/generation/examples.4b284b21bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1778b74412100ad8a6ce02d2ab7f2c4c0db5b8d7fc726a07a300914aa89fce85 +size 8291229 diff --git a/4b284b21bc4seed3/evaluation/generation/examples.4b284b21bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl b/4b284b21bc4seed3/evaluation/generation/examples.4b284b21bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..4964b92444942adb6cfc6ea112a9bde327455965 --- /dev/null +++ b/4b284b21bc4seed3/evaluation/generation/examples.4b284b21bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9db1f81a4600df6adaf92b8672effe704919ecd543b5181473b150f955a0642a +size 9378722 diff --git a/4b284b21bc4seed3/evaluation/generation/examples.4b284b21bc4seed3_gem_xsum_article_DOC_summary_0.jsonl b/4b284b21bc4seed3/evaluation/generation/examples.4b284b21bc4seed3_gem_xsum_article_DOC_summary_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..d49eb64947dba98d869c03f06175e46648b040f9 --- /dev/null +++ b/4b284b21bc4seed3/evaluation/generation/examples.4b284b21bc4seed3_gem_xsum_article_DOC_summary_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:804bc8c2f87b77918eebf2c3c9623910f7707c5cf2d41cbdd90915fe75e42024 +size 2802723 diff --git a/4b284b21bc4seed3/evaluation/generation/examples.4b284b21bc4seed3_gem_xsum_article_DOC_summary_1.jsonl b/4b284b21bc4seed3/evaluation/generation/examples.4b284b21bc4seed3_gem_xsum_article_DOC_summary_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..3c06dad6886a01dc7d9b79f4e2066685e392d62d --- /dev/null +++ b/4b284b21bc4seed3/evaluation/generation/examples.4b284b21bc4seed3_gem_xsum_article_DOC_summary_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b6514d58c50aed26bb61d7ce5f1bda5b16861567bbc9ccd37c3995819bf8626e +size 5106968 diff --git a/4b284b21bc4seed3/evaluation/generation/examples.4b284b21bc4seed3_gem_xsum_article_DOC_summary_2.jsonl b/4b284b21bc4seed3/evaluation/generation/examples.4b284b21bc4seed3_gem_xsum_article_DOC_summary_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..05551746ab17bcfe0ae496f4a0753e4eda0c34d5 --- /dev/null +++ b/4b284b21bc4seed3/evaluation/generation/examples.4b284b21bc4seed3_gem_xsum_article_DOC_summary_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8dd6d9bdd6728b4239139e385db3960d3b61ff6e0605dc462847a7d8d4ec5d8a +size 7381412 diff --git a/4b284b21bc4seed3/evaluation/generation/examples.4b284b21bc4seed3_gem_xsum_article_DOC_summary_3.jsonl b/4b284b21bc4seed3/evaluation/generation/examples.4b284b21bc4seed3_gem_xsum_article_DOC_summary_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..fce84a0cbe1b174117be391e624a5c60ad779e8c --- /dev/null +++ b/4b284b21bc4seed3/evaluation/generation/examples.4b284b21bc4seed3_gem_xsum_article_DOC_summary_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84fa582a564d16cc4fdc2890de52f14954a8a1cfe955f7541d8293e1efff1ea6 +size 9648203 diff --git a/4b284b21bc4seed3/evaluation/generation/examples.4b284b21bc4seed3_gem_xsum_article_DOC_summary_4.jsonl b/4b284b21bc4seed3/evaluation/generation/examples.4b284b21bc4seed3_gem_xsum_article_DOC_summary_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..cc6dc870d511b710b75bd31691aa0318ffe2af8c --- /dev/null +++ b/4b284b21bc4seed3/evaluation/generation/examples.4b284b21bc4seed3_gem_xsum_article_DOC_summary_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb0fe85ecd0c8f904ee5a1eff423372921e08b6c81608072836b0627ce4c0d1e +size 11672785 diff --git a/4b284b21bc4seed3/evaluation/generation/examples.4b284b21bc4seed3_gem_xsum_article_DOC_summary_5.jsonl b/4b284b21bc4seed3/evaluation/generation/examples.4b284b21bc4seed3_gem_xsum_article_DOC_summary_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..dc5606e8075d696f79668fd4cd0c506ba4e3bf8b --- /dev/null +++ b/4b284b21bc4seed3/evaluation/generation/examples.4b284b21bc4seed3_gem_xsum_article_DOC_summary_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d343ffc163c2a772317ec6ffbb3f1804cfb868fe2d3098220a631cf2f3fe146 +size 13897506 diff --git a/4b284b21bc4seed3/evaluation/generation/slim.4b284b21bc4seed3_GEM-web_nlg_en_PALM_prompt_0.json b/4b284b21bc4seed3/evaluation/generation/slim.4b284b21bc4seed3_GEM-web_nlg_en_PALM_prompt_0.json new file mode 100644 index 0000000000000000000000000000000000000000..b5fd0b04b8ac3abcd4436042e500f91f79d8fd4f --- /dev/null +++ b/4b284b21bc4seed3/evaluation/generation/slim.4b284b21bc4seed3_GEM-web_nlg_en_PALM_prompt_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.38535441961499517, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.03552663485548509 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.07392314530016614, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0017416928662543226 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.31161026039179884, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0047814670849113125 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.11065558909994337, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0020016224462212732 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.03387963683203527, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0009418685192906572 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.15167229813850266, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.003249849487394629 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.052101576521840554, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.001254434060918415 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.07143509621818969, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0016292918867949191 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.30392322887986606, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004670559568432556 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.10721119439428567, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.001872014217214712 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.0707943641461647, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0016472302036406458 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.2986281388001843, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0045364052998747 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.10596966360979974, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.001881280054371966 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b21bc4seed3/evaluation/generation/slim.4b284b21bc4seed3_GEM-web_nlg_en_PALM_prompt_1.json b/4b284b21bc4seed3/evaluation/generation/slim.4b284b21bc4seed3_GEM-web_nlg_en_PALM_prompt_1.json new file mode 100644 index 0000000000000000000000000000000000000000..2b5e4b641455e8706693d19d36c8ddb79145c350 --- /dev/null +++ b/4b284b21bc4seed3/evaluation/generation/slim.4b284b21bc4seed3_GEM-web_nlg_en_PALM_prompt_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.5512129467367316, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.0395418255366758 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.08196746460318716, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0014754369831595647 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.40914147014095936, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0053861796031930845 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.1276921926781691, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0018832476710271726 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.03760548245806836, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0008485772447386252 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.2004779256099399, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0039022297404803946 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.05919617667381684, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0012055006346489835 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.07759729021254366, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0013607454921227458 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.38809219654571864, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.005037385606363737 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.12093972964797003, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0017235569265706195 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.07790072285955618, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.00140465482895153 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.38623053862621287, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004945962835138011 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.12119435037639528, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.001776101552985325 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b21bc4seed3/evaluation/generation/slim.4b284b21bc4seed3_GEM-web_nlg_en_PALM_prompt_2.json b/4b284b21bc4seed3/evaluation/generation/slim.4b284b21bc4seed3_GEM-web_nlg_en_PALM_prompt_2.json new file mode 100644 index 0000000000000000000000000000000000000000..dd0da2f4cb1a22081a4c288e9587b6e4bd2f6992 --- /dev/null +++ b/4b284b21bc4seed3/evaluation/generation/slim.4b284b21bc4seed3_GEM-web_nlg_en_PALM_prompt_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.5933018254177376, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.032599794867965604 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.08138207976281618, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.001320028581758322 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.41969083219702635, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0051938217749552314 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.12805421977747078, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0017731859601500346 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.03774533356166905, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0008138836014742545 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.21183011597903806, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0039019044052842713 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.05973961241278947, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0011408079330925724 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.07647361432812638, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.001197053850440824 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.3943345910974271, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004791104064669637 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.12034876582957013, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0016107770822709627 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.07733964505952771, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.001246953646848645 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.3972043924885929, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0047988833920575725 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.12158519620974508, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0016694470344012931 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b21bc4seed3/evaluation/generation/slim.4b284b21bc4seed3_GEM-web_nlg_en_PALM_prompt_3.json b/4b284b21bc4seed3/evaluation/generation/slim.4b284b21bc4seed3_GEM-web_nlg_en_PALM_prompt_3.json new file mode 100644 index 0000000000000000000000000000000000000000..950f0afc85bb37965562f2d7151df6f59c3469a4 --- /dev/null +++ b/4b284b21bc4seed3/evaluation/generation/slim.4b284b21bc4seed3_GEM-web_nlg_en_PALM_prompt_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.6676820645573561, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.029698241159243657 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.08199443734871886, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0013044083678416126 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.4326296696301956, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.005319027568329476 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.12983004472435894, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0017904512351955197 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.03836456544897309, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0008016019880007896 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.2182970907135364, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0039434390311428045 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.06110341345845585, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0011495434475286368 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.07660172161550755, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0011750201739650409 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.4026463135770865, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004800741095877209 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.12124821447948028, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0016083744034722292 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.07783198204724436, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0012330922500882204 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.40862496584299657, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004878219295388798 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.12313018758539385, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0016863121667983272 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b21bc4seed3/evaluation/generation/slim.4b284b21bc4seed3_GEM-web_nlg_en_PALM_prompt_4.json b/4b284b21bc4seed3/evaluation/generation/slim.4b284b21bc4seed3_GEM-web_nlg_en_PALM_prompt_4.json new file mode 100644 index 0000000000000000000000000000000000000000..040fa7dbdf4fe8ee437280d9309471f813f2ef36 --- /dev/null +++ b/4b284b21bc4seed3/evaluation/generation/slim.4b284b21bc4seed3_GEM-web_nlg_en_PALM_prompt_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.6836151545167003, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.029089321693769803 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.08237641519365944, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0012712811379550952 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.4410392252234467, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.005252924753314178 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.13090538213539582, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0017570477742261594 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.038294697830682935, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0007935145188603823 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.22196349128777046, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0039874400036358035 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.061203868765094024, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.001147850507777741 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.07647361824568906, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0011522230823326422 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.40690715092516466, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0047151717706141886 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.12140909248039315, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.00158909093789567 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.07814715491035078, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0012030810779768226 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.4163700311086396, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.00483547149960936 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.12407530125753383, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0016569917198277998 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b21bc4seed3/evaluation/generation/slim.4b284b21bc4seed3_GEM-web_nlg_en_PALM_prompt_5.json b/4b284b21bc4seed3/evaluation/generation/slim.4b284b21bc4seed3_GEM-web_nlg_en_PALM_prompt_5.json new file mode 100644 index 0000000000000000000000000000000000000000..79e4ea5fa0a8bde76c9564f7c8d1273cba089989 --- /dev/null +++ b/4b284b21bc4seed3/evaluation/generation/slim.4b284b21bc4seed3_GEM-web_nlg_en_PALM_prompt_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.770273022704267, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.034315297186777595 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.08203708357705593, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0012436710783140608 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.4527088578344478, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.005270512909014665 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.13101067212098677, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0017066218312728107 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.03796634902700147, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0007628000916252061 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.23182459931655927, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.004137297126449473 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.061162270106061005, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.001104511682001034 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.07531042150309193, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0011067305255883584 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.41469386205754033, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004724284504576538 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.12018039624183414, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0015114350444937687 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.07740826323217029, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0011667399100477348 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.426759509472668, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004893799458515002 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.1235732065654381, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0015991738579748697 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b21bc4seed3/evaluation/generation/slim.4b284b21bc4seed3_GEM-wiki_lingua_en_tldr_en_0.json b/4b284b21bc4seed3/evaluation/generation/slim.4b284b21bc4seed3_GEM-wiki_lingua_en_tldr_en_0.json new file mode 100644 index 0000000000000000000000000000000000000000..54573ed61862477483b83185aca88d5ab7bbdb6e --- /dev/null +++ b/4b284b21bc4seed3/evaluation/generation/slim.4b284b21bc4seed3_GEM-wiki_lingua_en_tldr_en_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.15679162263674679, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0019991369518845767 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.2689745748726192, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0029016224540331552 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.18416362480898446, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0019831229958442082 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.03467120760519669, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0008221744008462381 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.06209758141565476, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0015832249597357217 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.04094718247147155, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0009244238662338802 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.12082089693911753, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0014097474863449463 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.2144029920856489, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.002350903120057298 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.14338902877501125, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0014226956074527863 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.1433977232378843, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0018222721919399013 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.24699886538862653, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0026942999677837982 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.1686525979999314, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0018124703517444088 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 1.8921440063023223, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.07135112924486753 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b21bc4seed3/evaluation/generation/slim.4b284b21bc4seed3_GEM-wiki_lingua_en_tldr_en_1.json b/4b284b21bc4seed3/evaluation/generation/slim.4b284b21bc4seed3_GEM-wiki_lingua_en_tldr_en_1.json new file mode 100644 index 0000000000000000000000000000000000000000..3a8c17c9e1c28bfc3670c3e3d5a2256df408a952 --- /dev/null +++ b/4b284b21bc4seed3/evaluation/generation/slim.4b284b21bc4seed3_GEM-wiki_lingua_en_tldr_en_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.18997860617259896, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0021315131916909724 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.31970644615930655, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0028665402668271315 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.22027730929537712, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0019608589609497263 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.046578501178857534, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0009806080013812627 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.08133508293170587, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0017593067161220152 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.05398367197056974, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0010308834876363582 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.1329141418602316, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0014073779291519839 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.23157078499816725, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.002239708119405446 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.15563014047034032, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0013088183409122065 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.1786247909527116, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0020029209788265186 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.3014126188767162, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0027138736966177968 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.2072131798418733, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0018385432787880404 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 2.8056438776711543, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.0837473028373607 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b21bc4seed3/evaluation/generation/slim.4b284b21bc4seed3_GEM-wiki_lingua_en_tldr_en_2.json b/4b284b21bc4seed3/evaluation/generation/slim.4b284b21bc4seed3_GEM-wiki_lingua_en_tldr_en_2.json new file mode 100644 index 0000000000000000000000000000000000000000..7157ce8d358c96a682f68e7d8ca253738955df93 --- /dev/null +++ b/4b284b21bc4seed3/evaluation/generation/slim.4b284b21bc4seed3_GEM-wiki_lingua_en_tldr_en_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.19848212426092088, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0023139570614517783 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.31608172323314615, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0027622954997235665 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.22219895534581124, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0019115852755068978 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.049990983654620055, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0011071845883649219 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.08099563488003071, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0017279951131225705 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.05522229843864866, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0010366643780952015 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.1388108427148649, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0016626769142365268 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.22710405861686703, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0022002521830572098 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.15589253405198344, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0012973150218916173 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.18757113799557207, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0021914037253074584 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.2994878980311641, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0026463012724863054 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.2100590256285955, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0018001298788378707 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 2.9780392590967417, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.07485005723665485 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b21bc4seed3/evaluation/generation/slim.4b284b21bc4seed3_GEM-wiki_lingua_en_tldr_en_3.json b/4b284b21bc4seed3/evaluation/generation/slim.4b284b21bc4seed3_GEM-wiki_lingua_en_tldr_en_3.json new file mode 100644 index 0000000000000000000000000000000000000000..8454597e77767b1b69984075362877eb7e60cd4c --- /dev/null +++ b/4b284b21bc4seed3/evaluation/generation/slim.4b284b21bc4seed3_GEM-wiki_lingua_en_tldr_en_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.17134837432784916, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.002648910653676966 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.25800000600290435, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.003313810821871368 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.18197691858961074, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.002206594668965237 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.04161503586356084, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0011270454940689701 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.06562904781876294, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0016912238278118353 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.044357885260241585, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0009768044123671569 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.12351815672543218, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.002041531952456252 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.18830813752138773, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0025923821492611896 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.13010623261113158, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0015513282273767694 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.16212518594924535, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0025194852893668154 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.24439649503938565, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0031617457131678586 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.17213683153876608, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0020822081122974664 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 2.847512210211642, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.08130288880844025 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b21bc4seed3/evaluation/generation/slim.4b284b21bc4seed3_GEM-wiki_lingua_en_tldr_en_4.json b/4b284b21bc4seed3/evaluation/generation/slim.4b284b21bc4seed3_GEM-wiki_lingua_en_tldr_en_4.json new file mode 100644 index 0000000000000000000000000000000000000000..10274a2153dbfc5fff726ddd187d81236200f464 --- /dev/null +++ b/4b284b21bc4seed3/evaluation/generation/slim.4b284b21bc4seed3_GEM-wiki_lingua_en_tldr_en_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.05513001019844826, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.00215178654051168 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.08454226315750968, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.002935250128250436 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.057107296289159025, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0019494380017288225 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.013800421209577515, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.000858478532665541 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.021959372595934164, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.001194364786706014 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.014135921586219569, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0006914493317450905 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.04128275764961394, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0016823042515051513 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.0637605084786262, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0022692310247988275 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.04216170229604133, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0014236179778487777 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.051975929888249256, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.002028731950450667 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.07986443919003557, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0027755366306270973 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.05379079735955767, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0018282128528245283 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 0.6551089372553552, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.04895444931980532 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b21bc4seed3/evaluation/generation/slim.4b284b21bc4seed3_GEM-wiki_lingua_en_tldr_en_5.json b/4b284b21bc4seed3/evaluation/generation/slim.4b284b21bc4seed3_GEM-wiki_lingua_en_tldr_en_5.json new file mode 100644 index 0000000000000000000000000000000000000000..63b46f089db46fb4d069bd18b696795840a7700f --- /dev/null +++ b/4b284b21bc4seed3/evaluation/generation/slim.4b284b21bc4seed3_GEM-wiki_lingua_en_tldr_en_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.009676230361373621, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0010092112696239383 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.014009287778858652, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0013693091057835286 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.009311675141314384, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0008747369590243084 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.002516778405932201, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0003813647101277748 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.004189787625575326, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0006261364681498638 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.002405387772695905, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.00030042578765582695 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.007375708880019688, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0007995038887537955 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.010624417220719972, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0010701965664864565 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.006932807281073693, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0006486704498845653 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.009118809831121096, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0009682743549182715 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.01302829985395723, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0012830127121259097 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.008662236702193958, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0008161476026799892 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 9.282109221159003e-07, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 2.2223612520502284e-06 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b21bc4seed3/evaluation/generation/slim.4b284b21bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_0.json b/4b284b21bc4seed3/evaluation/generation/slim.4b284b21bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_0.json new file mode 100644 index 0000000000000000000000000000000000000000..d3620ed030c637f080243706dfd605e029eb5158 --- /dev/null +++ b/4b284b21bc4seed3/evaluation/generation/slim.4b284b21bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 0.6114974539510816, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.04527113203185075 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.05869533205508546, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.001497949313805969 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.03571922348667764, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0013948024749901261 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.03492593073320387, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0010376513872745155 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.004063213985026975, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0003541545577591494 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.006573047412918524, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0005456263764429907 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.004517028931517297, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.00036439768835932237 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.05805625987920658, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0014726688390761706 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.03532952206585685, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0013716820040930184 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.03456601494605734, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0010229273732960667 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.057416666705387066, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.001471227198507916 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.033493295914568566, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0012685265746055889 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.033356146432655866, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0009612249675140079 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b21bc4seed3/evaluation/generation/slim.4b284b21bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_1.json b/4b284b21bc4seed3/evaluation/generation/slim.4b284b21bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_1.json new file mode 100644 index 0000000000000000000000000000000000000000..d1b1e719e9394bd6ad03fb69f6b63784713af1e4 --- /dev/null +++ b/4b284b21bc4seed3/evaluation/generation/slim.4b284b21bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 11.33447911090928, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.14535102796873467 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.5083802018676299, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0032791833916447554 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.42190893586204214, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.002971819042737358 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.433797396683994, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0022987607409721217 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.23512517549601986, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0025920962511690763 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.19142011398550732, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0021166855984481392 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.19719568941249035, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0019377495452543357 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.37102243518103833, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.002904005844748298 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.30457624020087987, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0024007135826919603 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.31401062106699107, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0019834092080858665 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.41705381489741356, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.003122960946648587 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.34480646003082416, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0027214625950243783 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.3549188128484648, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.002246841679471083 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b21bc4seed3/evaluation/generation/slim.4b284b21bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_2.json b/4b284b21bc4seed3/evaluation/generation/slim.4b284b21bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_2.json new file mode 100644 index 0000000000000000000000000000000000000000..193cfcd1da5b293d2d563d1c659cc4c23c4ae044 --- /dev/null +++ b/4b284b21bc4seed3/evaluation/generation/slim.4b284b21bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 12.915730606248113, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.20474125011289426 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.5479863902027133, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0032369184668208516 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.441447062617084, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0029152320911209556 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.4631809810602233, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.002254496022709034 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.2694942093855683, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.002668904008037024 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.2131243378825482, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0021529009824731303 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.22387083492928028, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0019825042986668373 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.4057365701684737, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0029348734509084765 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.3240876063453124, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.002423564725696539 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.34081459166299144, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.002030967494387809 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.45419008644409004, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0031526651706947012 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.3644738218767085, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0027027920241602162 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.382975161960982, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0022658855724966864 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b21bc4seed3/evaluation/generation/slim.4b284b21bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_3.json b/4b284b21bc4seed3/evaluation/generation/slim.4b284b21bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_3.json new file mode 100644 index 0000000000000000000000000000000000000000..c9b5e80169f465bc35454b92e2810868532a2a7e --- /dev/null +++ b/4b284b21bc4seed3/evaluation/generation/slim.4b284b21bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 13.799049670661745, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.1818766642053644 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.5538154552713349, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0032031754343585057 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.4530213630135714, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.002889071639596583 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.4733021068886725, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.002229748270982301 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.2776711960124572, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.002669354319886314 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.22402395817155157, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0022252252780088967 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.23393615456741612, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0020284322092199397 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.4112498098162674, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.002912753431059431 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.33431398302211607, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0024572409829041286 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.34984277963163096, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0020650055785518843 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.46138958037109395, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0031283915205367083 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.37645205860452513, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0027190821967377665 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.3937728879658398, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0022887568890525446 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b21bc4seed3/evaluation/generation/slim.4b284b21bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_4.json b/4b284b21bc4seed3/evaluation/generation/slim.4b284b21bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_4.json new file mode 100644 index 0000000000000000000000000000000000000000..fcd33b933383278d704c380d897f8ae8ef78a32b --- /dev/null +++ b/4b284b21bc4seed3/evaluation/generation/slim.4b284b21bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 14.332946979780699, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.187321161876581 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.5502767036745366, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0032191855076160905 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.4601167935637563, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.002933097976024252 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.47698101030399137, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.002304125507421037 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.2764817164388747, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.002683961252587485 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.22893953263224417, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.002301850243468405 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.23686616389681567, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0020891392412113624 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.4088077687087317, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0029284110175963112 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.34034029264854043, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.002546438349753808 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.35299999087704836, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.002138766539340371 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.46022437266752997, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0031504453494794983 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.38497978756866746, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.00282067010132265 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.3988932621808988, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.002365288784954707 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b21bc4seed3/evaluation/generation/slim.4b284b21bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_5.json b/4b284b21bc4seed3/evaluation/generation/slim.4b284b21bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_5.json new file mode 100644 index 0000000000000000000000000000000000000000..574df007bd08cf7708c0b2d683aadcfe0fa0d23e --- /dev/null +++ b/4b284b21bc4seed3/evaluation/generation/slim.4b284b21bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 14.123246792588205, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.18981316484333496 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.5508575470527967, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.003172543361692212 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.4596250362933734, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0028838674948470076 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.4771521080848, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.002247583418148515 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.27785561114819307, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0026789931891456594 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.22893900538597906, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.002250810965306422 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.23757613806327457, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0020631855681245196 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.4128922710964347, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0029408076764540847 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.3432096183345724, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0025317938331892898 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.35646844538814754, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.002140481161608752 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.46456472542175714, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0031248622936883626 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.3874763961501519, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0027737834865428587 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.4021976919673297, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0023234845320029575 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b21bc4seed3/evaluation/generation/slim.4b284b21bc4seed3_gem_xsum_article_DOC_summary_0.json b/4b284b21bc4seed3/evaluation/generation/slim.4b284b21bc4seed3_gem_xsum_article_DOC_summary_0.json new file mode 100644 index 0000000000000000000000000000000000000000..5e3796b33288dd012267924edb57c23daa7935b5 --- /dev/null +++ b/4b284b21bc4seed3/evaluation/generation/slim.4b284b21bc4seed3_gem_xsum_article_DOC_summary_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.15967577438396582, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.002367262573167645 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.3344097957704383, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.004542927765114456 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.20731019337768042, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0026329404650807355 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.03607001702892568, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.001380428573706143 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.08085696005427423, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0028599271086292063 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.04779740432400501, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0016427567157124747 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.12124210013250766, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0018353599935403793 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.25607740438919824, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0036003883952627205 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.1576331231529663, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0019951539963787477 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.1242181328811872, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0019619556407432866 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.26337373173306655, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.004025744770152854 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.16181781523790845, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0022319416867268445 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 1.949120361010708, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.0913394024073436 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b21bc4seed3/evaluation/generation/slim.4b284b21bc4seed3_gem_xsum_article_DOC_summary_1.json b/4b284b21bc4seed3/evaluation/generation/slim.4b284b21bc4seed3_gem_xsum_article_DOC_summary_1.json new file mode 100644 index 0000000000000000000000000000000000000000..afb6cafe1910871764bae3b49d6e76c87890e3a3 --- /dev/null +++ b/4b284b21bc4seed3/evaluation/generation/slim.4b284b21bc4seed3_gem_xsum_article_DOC_summary_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.12169091971501833, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0018485062787122516 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.2985653730389386, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.004290053847052186 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.17081587570763854, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.002498720216403539 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.02579297493046093, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0010284490730061247 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.06657394965502363, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0027184784375237805 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.03675651772088566, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0014655540573612757 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.09903048460831103, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0014377536580800821 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.24509693147391448, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.003518979975606831 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.1393113978609222, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0019655986810200457 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.09661401587871966, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0015465093492546976 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.23906516897153357, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.003723173758494015 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.13592809650365684, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0021149395154476942 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 1.3894434901616817, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.0696818577382309 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b21bc4seed3/evaluation/generation/slim.4b284b21bc4seed3_gem_xsum_article_DOC_summary_2.json b/4b284b21bc4seed3/evaluation/generation/slim.4b284b21bc4seed3_gem_xsum_article_DOC_summary_2.json new file mode 100644 index 0000000000000000000000000000000000000000..57a6ade830fc779649ce63975683e6535abc1598 --- /dev/null +++ b/4b284b21bc4seed3/evaluation/generation/slim.4b284b21bc4seed3_gem_xsum_article_DOC_summary_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.12932415674769882, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0018169766878992155 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.31588294560858055, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.004216644148639617 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.1812341104304252, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0024420789648274964 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.02882443972103835, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0010221845705623207 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.07321267293223659, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0026752083496981217 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.04085037987286443, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0014441866865235443 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.10675121708053566, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0014369855194212536 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.26192576739698237, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.003428288975677526 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.1497403639141996, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0019366476236409818 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.10009767181496847, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0014618075217660356 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.2471962036151299, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.003570649420240086 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.1406991990555183, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0019931907678247163 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 1.519028859842843, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.10932835465017057 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b21bc4seed3/evaluation/generation/slim.4b284b21bc4seed3_gem_xsum_article_DOC_summary_3.json b/4b284b21bc4seed3/evaluation/generation/slim.4b284b21bc4seed3_gem_xsum_article_DOC_summary_3.json new file mode 100644 index 0000000000000000000000000000000000000000..5dde9245475d99af3c524d880230fce85816d776 --- /dev/null +++ b/4b284b21bc4seed3/evaluation/generation/slim.4b284b21bc4seed3_gem_xsum_article_DOC_summary_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.12669828356422383, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0020094917781438 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.2991027968300709, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.004591383921824911 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.17398457366386533, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0026011912639339633 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.02846440216262034, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0010956946533866802 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.0706413058306802, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0027868384974826573 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.03976972720010616, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0015117103431558975 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.10522998362089304, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0016066968369183466 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.24989448115090335, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.003818419767894932 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.14481676263378276, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0021155906125953196 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.09817348971720044, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0016441110742716834 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.23394639249573773, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0039702384387275 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.13514679304649532, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.002182435634289256 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 1.6370716620193742, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.0965616345735323 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b21bc4seed3/evaluation/generation/slim.4b284b21bc4seed3_gem_xsum_article_DOC_summary_4.json b/4b284b21bc4seed3/evaluation/generation/slim.4b284b21bc4seed3_gem_xsum_article_DOC_summary_4.json new file mode 100644 index 0000000000000000000000000000000000000000..b73f088ce3287eea27a74de2214ecbb392ff9b5b --- /dev/null +++ b/4b284b21bc4seed3/evaluation/generation/slim.4b284b21bc4seed3_gem_xsum_article_DOC_summary_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.04259238619227563, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0027101471976600064 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.07720379689124833, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.0044603739276368026 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.05007677852098019, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0028520829549217 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.01039550194215322, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0013002683205402986 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.01810305312651028, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0015721872697551358 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.011518858251746018, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.00100875710859823 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.03523709895823149, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.00227881816047799 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.06319492439650329, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0036104810452688464 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.04100139142500078, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.002305891008745547 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.03483815068281454, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0023451054837002874 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.06212330010384987, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.00366876474124129 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.040275422096666895, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0023372301427381265 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 0.8669272479971863, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.1405646989169273 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b21bc4seed3/evaluation/generation/slim.4b284b21bc4seed3_gem_xsum_article_DOC_summary_5.json b/4b284b21bc4seed3/evaluation/generation/slim.4b284b21bc4seed3_gem_xsum_article_DOC_summary_5.json new file mode 100644 index 0000000000000000000000000000000000000000..7ce56049e6ef9b3d434b8d9a5ba6bcdfe3017af0 --- /dev/null +++ b/4b284b21bc4seed3/evaluation/generation/slim.4b284b21bc4seed3_gem_xsum_article_DOC_summary_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.003588402424856072, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.001048591574930412 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.0028604653610329457, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.0007986614088290892 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.0031002107990313337, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0008747175919556528 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.0007923025611704858, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0003921450634363378 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.0005498039696152904, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0002641981773098142 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.0006390516220219271, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.00030954190704298026 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.0027648078129268614, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0008127087627131919 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.0021867338334639443, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0006127280790696822 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.002386725038982092, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0006780512190033147 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.0030462311312536203, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0009151504800039854 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.0024328059752266973, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0006814073788898694 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.00262981517645366, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0007507411641340949 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 1.0463937563324107e-36, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 3.980151871433784e-31 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b21bc4seed3/evaluation/rankeval/4b284b21bc4seed3_0.json b/4b284b21bc4seed3/evaluation/rankeval/4b284b21bc4seed3_0.json new file mode 100644 index 0000000000000000000000000000000000000000..202e8a628e77ed9a6d201409499ca76c31bd688f --- /dev/null +++ b/4b284b21bc4seed3/evaluation/rankeval/4b284b21bc4seed3_0.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.336, + "acc_stderr": 0.014944140233795027 + }, + "anli_r2": { + "acc": 0.329, + "acc_stderr": 0.014865395385928364 + }, + "anli_r3": { + "acc": 0.34833333333333333, + "acc_stderr": 0.013759437498874072 + }, + "cb": { + "acc": 0.4642857142857143, + "acc_stderr": 0.0672477765493766, + "f1": 0.3271604938271605 + }, + "copa": { + "acc": 0.78, + "acc_stderr": 0.04163331998932261 + }, + "hellaswag": { + "acc": 0.47410874327823144, + "acc_stderr": 0.004983087049281741, + "acc_norm": 0.619896434973113, + "acc_norm_stderr": 0.004844199910173022 + }, + "rte": { + "acc": 0.5451263537906137, + "acc_stderr": 0.029973636495415252 + }, + "winogrande": { + "acc": 0.585635359116022, + "acc_stderr": 0.013844846232268563 + }, + "storycloze_2016": { + "acc": 0.726349545697488, + "acc_stderr": 0.0103097970944971 + }, + "boolq": { + "acc": 0.6201834862385321, + "acc_stderr": 0.008488668235778617 + }, + "arc_easy": { + "acc": 0.5909090909090909, + "acc_stderr": 0.010088775152615786, + "acc_norm": 0.5311447811447811, + "acc_norm_stderr": 0.010239860250021745 + }, + "arc_challenge": { + "acc": 0.2713310580204778, + "acc_stderr": 0.01299380772754579, + "acc_norm": 0.295221843003413, + "acc_norm_stderr": 0.013329750293382318 + }, + "sciq": { + "acc": 0.843, + "acc_stderr": 0.01151014697923019, + "acc_norm": 0.755, + "acc_norm_stderr": 0.013607356839598123 + }, + "piqa": { + "acc": 0.7595212187159956, + "acc_stderr": 0.009971345364651078, + "acc_norm": 0.764417845484222, + "acc_norm_stderr": 0.009901067586473883 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b21bc4seed3/evaluation/rankeval/4b284b21bc4seed3_0_lm-eval_global_step80108_2023-02-15-11-04-04_0shots_backup.json b/4b284b21bc4seed3/evaluation/rankeval/4b284b21bc4seed3_0_lm-eval_global_step80108_2023-02-15-11-04-04_0shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..202e8a628e77ed9a6d201409499ca76c31bd688f --- /dev/null +++ b/4b284b21bc4seed3/evaluation/rankeval/4b284b21bc4seed3_0_lm-eval_global_step80108_2023-02-15-11-04-04_0shots_backup.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.336, + "acc_stderr": 0.014944140233795027 + }, + "anli_r2": { + "acc": 0.329, + "acc_stderr": 0.014865395385928364 + }, + "anli_r3": { + "acc": 0.34833333333333333, + "acc_stderr": 0.013759437498874072 + }, + "cb": { + "acc": 0.4642857142857143, + "acc_stderr": 0.0672477765493766, + "f1": 0.3271604938271605 + }, + "copa": { + "acc": 0.78, + "acc_stderr": 0.04163331998932261 + }, + "hellaswag": { + "acc": 0.47410874327823144, + "acc_stderr": 0.004983087049281741, + "acc_norm": 0.619896434973113, + "acc_norm_stderr": 0.004844199910173022 + }, + "rte": { + "acc": 0.5451263537906137, + "acc_stderr": 0.029973636495415252 + }, + "winogrande": { + "acc": 0.585635359116022, + "acc_stderr": 0.013844846232268563 + }, + "storycloze_2016": { + "acc": 0.726349545697488, + "acc_stderr": 0.0103097970944971 + }, + "boolq": { + "acc": 0.6201834862385321, + "acc_stderr": 0.008488668235778617 + }, + "arc_easy": { + "acc": 0.5909090909090909, + "acc_stderr": 0.010088775152615786, + "acc_norm": 0.5311447811447811, + "acc_norm_stderr": 0.010239860250021745 + }, + "arc_challenge": { + "acc": 0.2713310580204778, + "acc_stderr": 0.01299380772754579, + "acc_norm": 0.295221843003413, + "acc_norm_stderr": 0.013329750293382318 + }, + "sciq": { + "acc": 0.843, + "acc_stderr": 0.01151014697923019, + "acc_norm": 0.755, + "acc_norm_stderr": 0.013607356839598123 + }, + "piqa": { + "acc": 0.7595212187159956, + "acc_stderr": 0.009971345364651078, + "acc_norm": 0.764417845484222, + "acc_norm_stderr": 0.009901067586473883 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b21bc4seed3/evaluation/rankeval/4b284b21bc4seed3_1.json b/4b284b21bc4seed3/evaluation/rankeval/4b284b21bc4seed3_1.json new file mode 100644 index 0000000000000000000000000000000000000000..c092ca2613a7e0c3f70e027ce8d975f7238094e5 --- /dev/null +++ b/4b284b21bc4seed3/evaluation/rankeval/4b284b21bc4seed3_1.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.33, + "acc_stderr": 0.01487687202745673 + }, + "anli_r2": { + "acc": 0.318, + "acc_stderr": 0.0147340793093119 + }, + "anli_r3": { + "acc": 0.3491666666666667, + "acc_stderr": 0.013767075395077247 + }, + "cb": { + "acc": 0.4642857142857143, + "acc_stderr": 0.06724777654937658, + "f1": 0.3333333333333333 + }, + "copa": { + "acc": 0.78, + "acc_stderr": 0.04163331998932262 + }, + "hellaswag": { + "acc": 0.46853216490738897, + "acc_stderr": 0.004979889597551665, + "acc_norm": 0.6188010356502689, + "acc_norm_stderr": 0.004846886929763445 + }, + "rte": { + "acc": 0.5523465703971119, + "acc_stderr": 0.02993107036293953 + }, + "winogrande": { + "acc": 0.580110497237569, + "acc_stderr": 0.013870943986310391 + }, + "storycloze_2016": { + "acc": 0.7145911277391769, + "acc_stderr": 0.010443395884062115 + }, + "boolq": { + "acc": 0.6214067278287462, + "acc_stderr": 0.00848334171802448 + }, + "arc_easy": { + "acc": 0.6077441077441077, + "acc_stderr": 0.010018744689650043, + "acc_norm": 0.5702861952861953, + "acc_norm_stderr": 0.010157908005763674 + }, + "arc_challenge": { + "acc": 0.29436860068259385, + "acc_stderr": 0.013318528460539426, + "acc_norm": 0.31569965870307165, + "acc_norm_stderr": 0.013582571095815291 + }, + "sciq": { + "acc": 0.887, + "acc_stderr": 0.010016552866696855, + "acc_norm": 0.856, + "acc_norm_stderr": 0.01110798754893915 + }, + "piqa": { + "acc": 0.750272034820457, + "acc_stderr": 0.010099232969867483, + "acc_norm": 0.7573449401523396, + "acc_norm_stderr": 0.010002002569708688 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b21bc4seed3/evaluation/rankeval/4b284b21bc4seed3_1_lm-eval_global_step80108_2023-02-15-11-04-05_1shots_backup.json b/4b284b21bc4seed3/evaluation/rankeval/4b284b21bc4seed3_1_lm-eval_global_step80108_2023-02-15-11-04-05_1shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..c092ca2613a7e0c3f70e027ce8d975f7238094e5 --- /dev/null +++ b/4b284b21bc4seed3/evaluation/rankeval/4b284b21bc4seed3_1_lm-eval_global_step80108_2023-02-15-11-04-05_1shots_backup.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.33, + "acc_stderr": 0.01487687202745673 + }, + "anli_r2": { + "acc": 0.318, + "acc_stderr": 0.0147340793093119 + }, + "anli_r3": { + "acc": 0.3491666666666667, + "acc_stderr": 0.013767075395077247 + }, + "cb": { + "acc": 0.4642857142857143, + "acc_stderr": 0.06724777654937658, + "f1": 0.3333333333333333 + }, + "copa": { + "acc": 0.78, + "acc_stderr": 0.04163331998932262 + }, + "hellaswag": { + "acc": 0.46853216490738897, + "acc_stderr": 0.004979889597551665, + "acc_norm": 0.6188010356502689, + "acc_norm_stderr": 0.004846886929763445 + }, + "rte": { + "acc": 0.5523465703971119, + "acc_stderr": 0.02993107036293953 + }, + "winogrande": { + "acc": 0.580110497237569, + "acc_stderr": 0.013870943986310391 + }, + "storycloze_2016": { + "acc": 0.7145911277391769, + "acc_stderr": 0.010443395884062115 + }, + "boolq": { + "acc": 0.6214067278287462, + "acc_stderr": 0.00848334171802448 + }, + "arc_easy": { + "acc": 0.6077441077441077, + "acc_stderr": 0.010018744689650043, + "acc_norm": 0.5702861952861953, + "acc_norm_stderr": 0.010157908005763674 + }, + "arc_challenge": { + "acc": 0.29436860068259385, + "acc_stderr": 0.013318528460539426, + "acc_norm": 0.31569965870307165, + "acc_norm_stderr": 0.013582571095815291 + }, + "sciq": { + "acc": 0.887, + "acc_stderr": 0.010016552866696855, + "acc_norm": 0.856, + "acc_norm_stderr": 0.01110798754893915 + }, + "piqa": { + "acc": 0.750272034820457, + "acc_stderr": 0.010099232969867483, + "acc_norm": 0.7573449401523396, + "acc_norm_stderr": 0.010002002569708688 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b21bc4seed3/evaluation/rankeval/4b284b21bc4seed3_2.json b/4b284b21bc4seed3/evaluation/rankeval/4b284b21bc4seed3_2.json new file mode 100644 index 0000000000000000000000000000000000000000..42328347da9ac54bcf526e47084be1d4427cae43 --- /dev/null +++ b/4b284b21bc4seed3/evaluation/rankeval/4b284b21bc4seed3_2.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.332, + "acc_stderr": 0.014899597242811475 + }, + "anli_r2": { + "acc": 0.333, + "acc_stderr": 0.014910846164229864 + }, + "anli_r3": { + "acc": 0.34, + "acc_stderr": 0.013680495725767797 + }, + "cb": { + "acc": 0.35714285714285715, + "acc_stderr": 0.06460957383809218, + "f1": 0.2528248587570622 + }, + "copa": { + "acc": 0.77, + "acc_stderr": 0.04229525846816506 + }, + "hellaswag": { + "acc": 0.46932881896036643, + "acc_stderr": 0.004980384575535383, + "acc_norm": 0.6172077275443139, + "acc_norm_stderr": 0.0048507486878599185 + }, + "rte": { + "acc": 0.4693140794223827, + "acc_stderr": 0.03003973059219781 + }, + "winogrande": { + "acc": 0.5927387529597474, + "acc_stderr": 0.013808654122417862 + }, + "storycloze_2016": { + "acc": 0.7183324425440941, + "acc_stderr": 0.010401844358587665 + }, + "boolq": { + "acc": 0.6180428134556575, + "acc_stderr": 0.00849785199842719 + }, + "arc_easy": { + "acc": 0.6195286195286195, + "acc_stderr": 0.009962305992058577, + "acc_norm": 0.5959595959595959, + "acc_norm_stderr": 0.01006906164954955 + }, + "arc_challenge": { + "acc": 0.295221843003413, + "acc_stderr": 0.01332975029338232, + "acc_norm": 0.30802047781569963, + "acc_norm_stderr": 0.013491429517292038 + }, + "sciq": { + "acc": 0.896, + "acc_stderr": 0.009658016218524301, + "acc_norm": 0.871, + "acc_norm_stderr": 0.010605256784796586 + }, + "piqa": { + "acc": 0.7464635473340587, + "acc_stderr": 0.010150090834551794, + "acc_norm": 0.7573449401523396, + "acc_norm_stderr": 0.010002002569708688 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b21bc4seed3/evaluation/rankeval/4b284b21bc4seed3_2_lm-eval_global_step80108_2023-02-15-11-04-04_2shots_backup.json b/4b284b21bc4seed3/evaluation/rankeval/4b284b21bc4seed3_2_lm-eval_global_step80108_2023-02-15-11-04-04_2shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..42328347da9ac54bcf526e47084be1d4427cae43 --- /dev/null +++ b/4b284b21bc4seed3/evaluation/rankeval/4b284b21bc4seed3_2_lm-eval_global_step80108_2023-02-15-11-04-04_2shots_backup.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.332, + "acc_stderr": 0.014899597242811475 + }, + "anli_r2": { + "acc": 0.333, + "acc_stderr": 0.014910846164229864 + }, + "anli_r3": { + "acc": 0.34, + "acc_stderr": 0.013680495725767797 + }, + "cb": { + "acc": 0.35714285714285715, + "acc_stderr": 0.06460957383809218, + "f1": 0.2528248587570622 + }, + "copa": { + "acc": 0.77, + "acc_stderr": 0.04229525846816506 + }, + "hellaswag": { + "acc": 0.46932881896036643, + "acc_stderr": 0.004980384575535383, + "acc_norm": 0.6172077275443139, + "acc_norm_stderr": 0.0048507486878599185 + }, + "rte": { + "acc": 0.4693140794223827, + "acc_stderr": 0.03003973059219781 + }, + "winogrande": { + "acc": 0.5927387529597474, + "acc_stderr": 0.013808654122417862 + }, + "storycloze_2016": { + "acc": 0.7183324425440941, + "acc_stderr": 0.010401844358587665 + }, + "boolq": { + "acc": 0.6180428134556575, + "acc_stderr": 0.00849785199842719 + }, + "arc_easy": { + "acc": 0.6195286195286195, + "acc_stderr": 0.009962305992058577, + "acc_norm": 0.5959595959595959, + "acc_norm_stderr": 0.01006906164954955 + }, + "arc_challenge": { + "acc": 0.295221843003413, + "acc_stderr": 0.01332975029338232, + "acc_norm": 0.30802047781569963, + "acc_norm_stderr": 0.013491429517292038 + }, + "sciq": { + "acc": 0.896, + "acc_stderr": 0.009658016218524301, + "acc_norm": 0.871, + "acc_norm_stderr": 0.010605256784796586 + }, + "piqa": { + "acc": 0.7464635473340587, + "acc_stderr": 0.010150090834551794, + "acc_norm": 0.7573449401523396, + "acc_norm_stderr": 0.010002002569708688 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b21bc4seed3/evaluation/rankeval/4b284b21bc4seed3_3.json b/4b284b21bc4seed3/evaluation/rankeval/4b284b21bc4seed3_3.json new file mode 100644 index 0000000000000000000000000000000000000000..2a00a3b600e1cb988fff6461cd325153c7c9819e --- /dev/null +++ b/4b284b21bc4seed3/evaluation/rankeval/4b284b21bc4seed3_3.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.328, + "acc_stderr": 0.014853842487270333 + }, + "anli_r2": { + "acc": 0.351, + "acc_stderr": 0.015100563798316409 + }, + "anli_r3": { + "acc": 0.34833333333333333, + "acc_stderr": 0.013759437498874086 + }, + "cb": { + "acc": 0.4107142857142857, + "acc_stderr": 0.06633634150359541, + "f1": 0.3815668202764977 + }, + "copa": { + "acc": 0.8, + "acc_stderr": 0.04020151261036845 + }, + "hellaswag": { + "acc": 0.46863174666401114, + "acc_stderr": 0.004979952166595543, + "acc_norm": 0.6213901613224457, + "acc_norm_stderr": 0.0048404936031661945 + }, + "rte": { + "acc": 0.5090252707581228, + "acc_stderr": 0.030091559826331334 + }, + "winogrande": { + "acc": 0.574585635359116, + "acc_stderr": 0.013895257666646378 + }, + "storycloze_2016": { + "acc": 0.7258150721539284, + "acc_stderr": 0.010316062787590006 + }, + "boolq": { + "acc": 0.6058103975535168, + "acc_stderr": 0.008546995661233634 + }, + "arc_easy": { + "acc": 0.6165824915824916, + "acc_stderr": 0.009976995068264717, + "acc_norm": 0.6060606060606061, + "acc_norm_stderr": 0.010026305355981814 + }, + "arc_challenge": { + "acc": 0.30119453924914674, + "acc_stderr": 0.01340674176784762, + "acc_norm": 0.31143344709897613, + "acc_norm_stderr": 0.013532472099850947 + }, + "sciq": { + "acc": 0.903, + "acc_stderr": 0.009363689373248088, + "acc_norm": 0.891, + "acc_norm_stderr": 0.009859828407037185 + }, + "piqa": { + "acc": 0.7611534276387377, + "acc_stderr": 0.0099481203853375, + "acc_norm": 0.7600652883569097, + "acc_norm_stderr": 0.009963625892809545 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b21bc4seed3/evaluation/rankeval/4b284b21bc4seed3_3_lm-eval_global_step80108_2023-02-15-11-04-04_3shots_backup.json b/4b284b21bc4seed3/evaluation/rankeval/4b284b21bc4seed3_3_lm-eval_global_step80108_2023-02-15-11-04-04_3shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..2a00a3b600e1cb988fff6461cd325153c7c9819e --- /dev/null +++ b/4b284b21bc4seed3/evaluation/rankeval/4b284b21bc4seed3_3_lm-eval_global_step80108_2023-02-15-11-04-04_3shots_backup.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.328, + "acc_stderr": 0.014853842487270333 + }, + "anli_r2": { + "acc": 0.351, + "acc_stderr": 0.015100563798316409 + }, + "anli_r3": { + "acc": 0.34833333333333333, + "acc_stderr": 0.013759437498874086 + }, + "cb": { + "acc": 0.4107142857142857, + "acc_stderr": 0.06633634150359541, + "f1": 0.3815668202764977 + }, + "copa": { + "acc": 0.8, + "acc_stderr": 0.04020151261036845 + }, + "hellaswag": { + "acc": 0.46863174666401114, + "acc_stderr": 0.004979952166595543, + "acc_norm": 0.6213901613224457, + "acc_norm_stderr": 0.0048404936031661945 + }, + "rte": { + "acc": 0.5090252707581228, + "acc_stderr": 0.030091559826331334 + }, + "winogrande": { + "acc": 0.574585635359116, + "acc_stderr": 0.013895257666646378 + }, + "storycloze_2016": { + "acc": 0.7258150721539284, + "acc_stderr": 0.010316062787590006 + }, + "boolq": { + "acc": 0.6058103975535168, + "acc_stderr": 0.008546995661233634 + }, + "arc_easy": { + "acc": 0.6165824915824916, + "acc_stderr": 0.009976995068264717, + "acc_norm": 0.6060606060606061, + "acc_norm_stderr": 0.010026305355981814 + }, + "arc_challenge": { + "acc": 0.30119453924914674, + "acc_stderr": 0.01340674176784762, + "acc_norm": 0.31143344709897613, + "acc_norm_stderr": 0.013532472099850947 + }, + "sciq": { + "acc": 0.903, + "acc_stderr": 0.009363689373248088, + "acc_norm": 0.891, + "acc_norm_stderr": 0.009859828407037185 + }, + "piqa": { + "acc": 0.7611534276387377, + "acc_stderr": 0.0099481203853375, + "acc_norm": 0.7600652883569097, + "acc_norm_stderr": 0.009963625892809545 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b21bc4seed3/evaluation/rankeval/4b284b21bc4seed3_4.json b/4b284b21bc4seed3/evaluation/rankeval/4b284b21bc4seed3_4.json new file mode 100644 index 0000000000000000000000000000000000000000..feb5094ffb22482946bbcd9bbd20d27c44b5f997 --- /dev/null +++ b/4b284b21bc4seed3/evaluation/rankeval/4b284b21bc4seed3_4.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.353, + "acc_stderr": 0.015120172605483699 + }, + "anli_r2": { + "acc": 0.36, + "acc_stderr": 0.015186527932040127 + }, + "anli_r3": { + "acc": 0.3641666666666667, + "acc_stderr": 0.013896714966807265 + }, + "cb": { + "acc": 0.5178571428571429, + "acc_stderr": 0.06737697508644647, + "f1": 0.4129474011826953 + }, + "copa": { + "acc": 0.78, + "acc_stderr": 0.041633319989322626 + }, + "hellaswag": { + "acc": 0.466938856801434, + "acc_stderr": 0.004978861409119803, + "acc_norm": 0.6222863971320454, + "acc_norm_stderr": 0.004838246410786256 + }, + "rte": { + "acc": 0.49097472924187724, + "acc_stderr": 0.030091559826331334 + }, + "winogrande": { + "acc": 0.585635359116022, + "acc_stderr": 0.013844846232268563 + }, + "storycloze_2016": { + "acc": 0.7300908605024051, + "acc_stderr": 0.01026541350322146 + }, + "boolq": { + "acc": 0.6220183486238532, + "acc_stderr": 0.008480656964585248 + }, + "arc_easy": { + "acc": 0.6233164983164983, + "acc_stderr": 0.00994284807747617, + "acc_norm": 0.6077441077441077, + "acc_norm_stderr": 0.010018744689650043 + }, + "arc_challenge": { + "acc": 0.3003412969283277, + "acc_stderr": 0.013395909309956999, + "acc_norm": 0.3148464163822526, + "acc_norm_stderr": 0.01357265770308495 + }, + "sciq": { + "acc": 0.904, + "acc_stderr": 0.009320454434783248, + "acc_norm": 0.898, + "acc_norm_stderr": 0.009575368801653897 + }, + "piqa": { + "acc": 0.7524483133841132, + "acc_stderr": 0.010069703966857106, + "acc_norm": 0.7584330794341676, + "acc_norm_stderr": 0.009986718001804453 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b21bc4seed3/evaluation/rankeval/4b284b21bc4seed3_4_lm-eval_global_step80108_2023-02-15-11-04-04_4shots_backup.json b/4b284b21bc4seed3/evaluation/rankeval/4b284b21bc4seed3_4_lm-eval_global_step80108_2023-02-15-11-04-04_4shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..feb5094ffb22482946bbcd9bbd20d27c44b5f997 --- /dev/null +++ b/4b284b21bc4seed3/evaluation/rankeval/4b284b21bc4seed3_4_lm-eval_global_step80108_2023-02-15-11-04-04_4shots_backup.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.353, + "acc_stderr": 0.015120172605483699 + }, + "anli_r2": { + "acc": 0.36, + "acc_stderr": 0.015186527932040127 + }, + "anli_r3": { + "acc": 0.3641666666666667, + "acc_stderr": 0.013896714966807265 + }, + "cb": { + "acc": 0.5178571428571429, + "acc_stderr": 0.06737697508644647, + "f1": 0.4129474011826953 + }, + "copa": { + "acc": 0.78, + "acc_stderr": 0.041633319989322626 + }, + "hellaswag": { + "acc": 0.466938856801434, + "acc_stderr": 0.004978861409119803, + "acc_norm": 0.6222863971320454, + "acc_norm_stderr": 0.004838246410786256 + }, + "rte": { + "acc": 0.49097472924187724, + "acc_stderr": 0.030091559826331334 + }, + "winogrande": { + "acc": 0.585635359116022, + "acc_stderr": 0.013844846232268563 + }, + "storycloze_2016": { + "acc": 0.7300908605024051, + "acc_stderr": 0.01026541350322146 + }, + "boolq": { + "acc": 0.6220183486238532, + "acc_stderr": 0.008480656964585248 + }, + "arc_easy": { + "acc": 0.6233164983164983, + "acc_stderr": 0.00994284807747617, + "acc_norm": 0.6077441077441077, + "acc_norm_stderr": 0.010018744689650043 + }, + "arc_challenge": { + "acc": 0.3003412969283277, + "acc_stderr": 0.013395909309956999, + "acc_norm": 0.3148464163822526, + "acc_norm_stderr": 0.01357265770308495 + }, + "sciq": { + "acc": 0.904, + "acc_stderr": 0.009320454434783248, + "acc_norm": 0.898, + "acc_norm_stderr": 0.009575368801653897 + }, + "piqa": { + "acc": 0.7524483133841132, + "acc_stderr": 0.010069703966857106, + "acc_norm": 0.7584330794341676, + "acc_norm_stderr": 0.009986718001804453 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b21bc4seed3/evaluation/rankeval/4b284b21bc4seed3_5.json b/4b284b21bc4seed3/evaluation/rankeval/4b284b21bc4seed3_5.json new file mode 100644 index 0000000000000000000000000000000000000000..0b980e8b40156ef5badcb4720f1f9b73674485fb --- /dev/null +++ b/4b284b21bc4seed3/evaluation/rankeval/4b284b21bc4seed3_5.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.361, + "acc_stderr": 0.015195720118175124 + }, + "anli_r2": { + "acc": 0.332, + "acc_stderr": 0.014899597242811475 + }, + "anli_r3": { + "acc": 0.3441666666666667, + "acc_stderr": 0.013720551062295755 + }, + "cb": { + "acc": 0.44642857142857145, + "acc_stderr": 0.06703189227942398, + "f1": 0.3336203597397627 + }, + "copa": { + "acc": 0.77, + "acc_stderr": 0.04229525846816506 + }, + "hellaswag": { + "acc": 0.4676359290977893, + "acc_stderr": 0.004979317515432522, + "acc_norm": 0.6258713403704441, + "acc_norm_stderr": 0.004829081532826523 + }, + "rte": { + "acc": 0.5054151624548736, + "acc_stderr": 0.030094698123239966 + }, + "winogrande": { + "acc": 0.5816890292028414, + "acc_stderr": 0.013863669961195908 + }, + "storycloze_2016": { + "acc": 0.721004810261892, + "acc_stderr": 0.010371620932652793 + }, + "boolq": { + "acc": 0.6152905198776758, + "acc_stderr": 0.008509403073229692 + }, + "arc_easy": { + "acc": 0.6245791245791246, + "acc_stderr": 0.0099362185271143, + "acc_norm": 0.6199494949494949, + "acc_norm_stderr": 0.009960175831493131 + }, + "arc_challenge": { + "acc": 0.30631399317406144, + "acc_stderr": 0.013470584417276513, + "acc_norm": 0.32337883959044367, + "acc_norm_stderr": 0.013669421630012122 + }, + "sciq": { + "acc": 0.913, + "acc_stderr": 0.008916866630745913, + "acc_norm": 0.904, + "acc_norm_stderr": 0.009320454434783217 + }, + "piqa": { + "acc": 0.7529923830250272, + "acc_stderr": 0.010062268140772629, + "acc_norm": 0.7540805223068553, + "acc_norm_stderr": 0.010047331865625184 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b21bc4seed3/evaluation/rankeval/4b284b21bc4seed3_5_lm-eval_global_step80108_2023-02-15-11-04-04_5shots_backup.json b/4b284b21bc4seed3/evaluation/rankeval/4b284b21bc4seed3_5_lm-eval_global_step80108_2023-02-15-11-04-04_5shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..0b980e8b40156ef5badcb4720f1f9b73674485fb --- /dev/null +++ b/4b284b21bc4seed3/evaluation/rankeval/4b284b21bc4seed3_5_lm-eval_global_step80108_2023-02-15-11-04-04_5shots_backup.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.361, + "acc_stderr": 0.015195720118175124 + }, + "anli_r2": { + "acc": 0.332, + "acc_stderr": 0.014899597242811475 + }, + "anli_r3": { + "acc": 0.3441666666666667, + "acc_stderr": 0.013720551062295755 + }, + "cb": { + "acc": 0.44642857142857145, + "acc_stderr": 0.06703189227942398, + "f1": 0.3336203597397627 + }, + "copa": { + "acc": 0.77, + "acc_stderr": 0.04229525846816506 + }, + "hellaswag": { + "acc": 0.4676359290977893, + "acc_stderr": 0.004979317515432522, + "acc_norm": 0.6258713403704441, + "acc_norm_stderr": 0.004829081532826523 + }, + "rte": { + "acc": 0.5054151624548736, + "acc_stderr": 0.030094698123239966 + }, + "winogrande": { + "acc": 0.5816890292028414, + "acc_stderr": 0.013863669961195908 + }, + "storycloze_2016": { + "acc": 0.721004810261892, + "acc_stderr": 0.010371620932652793 + }, + "boolq": { + "acc": 0.6152905198776758, + "acc_stderr": 0.008509403073229692 + }, + "arc_easy": { + "acc": 0.6245791245791246, + "acc_stderr": 0.0099362185271143, + "acc_norm": 0.6199494949494949, + "acc_norm_stderr": 0.009960175831493131 + }, + "arc_challenge": { + "acc": 0.30631399317406144, + "acc_stderr": 0.013470584417276513, + "acc_norm": 0.32337883959044367, + "acc_norm_stderr": 0.013669421630012122 + }, + "sciq": { + "acc": 0.913, + "acc_stderr": 0.008916866630745913, + "acc_norm": 0.904, + "acc_norm_stderr": 0.009320454434783217 + }, + "piqa": { + "acc": 0.7529923830250272, + "acc_stderr": 0.010062268140772629, + "acc_norm": 0.7540805223068553, + "acc_norm_stderr": 0.010047331865625184 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f9a873ce90f5e8f57cc44f80dbc46580e4065187 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a253131dafd16de7ba2db71759749a5f2d5d8f49c1c05fd1ac4e597fb4088acb +size 199058647 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..72c4eef28618380c406103cb8af12218eea18271 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d2d4714a6e3d99335c07ed4aca729c6d232ac59e5a8a04af43703bb34b2877f1 +size 199058647 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ae099a0e2f585093f2cf1e68825766bf274d636c --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d8a9df10cb097c36dbf0edd00d5e4721a5abdd0ad1e9c03233920ca8cafdac34 +size 199058733 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ce5406f5559530442aff98c216a1493a9e80522e --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dcc338611857d7c8de68ed560675185464bc89d7efc1379d6ee784eda3f449b7 +size 199058733 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..81c5f60379bb38929d6114fb1f6327614cd31df8 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c630f123a82178c6b3552a1c8b2eeb946963aacf2fee9e5a050d38ac6900472 +size 199058797 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b53a6957fbb3e9d00a3eb9c05faac8050e3a6b93 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a38efcd69cd4fbf1b653c2e1173205d8fc1e539b108909a1330e854d6b92e6ee +size 199058797 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a70cf9e7efe7af6a6d0aa5524d9dc3ba0c6832bd --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da57e5244a2f11b6c814c5f43bac4e793260fa171305599fa947f729ffe91bb9 +size 199058733 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..77e5069fbb00249455a1de0167bc89f4d151d933 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:59045555356713f5a597da7777bdfe1fb59ee1a2923a91d4bbb5f47c53698679 +size 199058733 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..10e705cc1e2a09b35a104ced0f03dc95f9da4a0a --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cad25db6a6c63545cb7d7e100f7ac8fd52eb7c0a5363fa2a69cca201c78bfcac +size 199058733 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..601634f97cc162830fc967c3324040f0d34331af --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb553f72be9377eb439f0e71cb9b3e887d9f04fbaa7e91b06d48ee781a6b37a5 +size 199058733 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a00a4098d422e47a90b0201d383cf98457447246 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7592cf73d09bea3dae30ea2c896e3a76d44ae0c87329f4d13d1bd9e8ba68c483 +size 199058797 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d70444f8ba6b5497cb0b58080e16711f88fb917d --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e074e3148f2b1adf0985fbb5b4013e67016a5321f6751f5d7122de01fb22791 +size 199058797 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6b45d8adf3d7347dd21db66fae0fa87bf2de397c --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f66505c378224a03daa2fedbb35c7d407b6f76fd7c4320a31e485b35972d4a0d +size 199058733 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0aa91b6455b467ce78634f3b41f2523aa900332d --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d5cbee049c09b40e883085052bc4223fbf50d8d00ef2512a7279352c990b04e3 +size 199058733 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1863b23d7d61feb63e4f751d46372a340743369b --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae255536e3b4834dec69b2fccd4c7de5183e2cd158fda4afe71a858e204c96b6 +size 199058669 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2c0677bf143aa593c9f0d186f4042d2be89370e4 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b5ceee3f414a6aeb019b574d1538e42df5ab18ab795079236094633135c28f1 +size 199058669 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a43b0a257ffa470b2ccf431c26c1b9f2666889d2 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:53c2a2903eeaf4ad2e8a89931cb4b6530131323c2de8a86eaf65d936c93e301b +size 199058797 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..41294df79902fbc7cbb24136c1e0d94eddc045af --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d16f21d8b9f3c5ed346c1d6ef69e17cee6f488ab006f63059eba3c8aee2772f +size 199058797 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..70450181ed9b3d7b1b10a9b379607992807293fd --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c2485b86f607891c86acf6d57bd829c04caf95267c2746eb2f7c91735725a949 +size 199058733 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a312c73b8afff458031c46a80915d16db90aa042 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e0306858f7e4af2b1245889b12490caa40edd7ee9999b9e60380e7766b46649f +size 199058733 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..481e61985dc0a577415cc844c8140fbb4b8eadb6 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dec570e1187ea0e911cd8a408d2445da073138067914760097ee7a0da26cf682 +size 199058733 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..66c3b95586575b1209bd6d43beb8f491a85d3f78 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b1474fc3c29017fbe6b0232ab12d77ee493512efb6658cc49392e982d5918ba +size 199058733 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b918aa62d35ca5d7ffebecf1e492e4503bfb143b --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:52f673aa9adad78a3502ffd7c637236502222bebbc2b076071e36db74a2975c6 +size 199058658 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cf6c8aa813d332a0b40bf550acdc2aa460fe7f6c --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd55f6206c5df5c907ed314c5c5a931ba344f32ed04c7c543f44cb83eb9c1f3a +size 199058658 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fd90ea6e4f69a49023ecdc8c92a2fae7601d5bc9 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb7d04e48357508733b0debd9a02864c5af40721ee90c7ff6e39515d45812ade +size 199058733 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..11c3a60300ff068539e9edecc394b9ae3515e486 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0272325c25304ae613d3020f3f15cdb13e7cd57db78897df4da52e7c76b34fa9 +size 199058733 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..98de3ac4c922c8d2b32e378dcfd6fef8266c5103 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb4ef0b8906b5ce351ff7e43d6e2362604f44fd51de7b78883b52a4cba1477e8 +size 199058797 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..66e4a21cc9df197dd19f0c87b54695b960ec77a5 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:734bda90c0bb1f52b324010b1c5963161ceb9c2d8d78bb7e796c37e12e1c5a76 +size 199058797 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dc9012c6e903035750885b08eaccfc50339400d7 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b03e32fd095b0bd83c8efb53720e2a3b4db04d8ad8493f6b15bafd74ba7634eb +size 199058605 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d7f51e628b92373dc72d7dd1d53fad1635791698 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f6222045abe88aacd2d91bad11b9feb6bf6ba5a8e7171a8acc8ff2f013d2f6ba +size 199058605 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f15d964c25f5e12e0c3e02f9d85ab9a0c73c373e --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6a8e8266f19cfb41b390d23ecae3929b9873a13ae05dc8278b16b4dd07c15f1b +size 199058669 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e02bba43c2eaf01c838779e503c44d24300f38d0 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bdf2fc21a61c4abbda990b79cf53adfa78fef3c55e29930602fcaa70286ab802 +size 199058669 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b51cd789745851cf14073266703c21290633db4a --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf4991c046b8e5c9a39f2c2734c723084bb5842030bebecd3d0de5a9437b3712 +size 199058797 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f988bc124564dcd6909b0585ceb6dbed57df3dd4 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d1ff06a3ff4579b177a2dfc4bb12e719003de474fcd43b72db2d1944258740d +size 199058797 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d19d9c0255a824de382547f27e8431ae603e9d00 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e51a03517c1bec0913fff8b5dd4e93a551e21c0906aae3ec4bd450ef0020c35d +size 199058733 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..39b5afc7ad54f4b8332c9ae8b23af3d45ec1255b --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:855f781f3ac9cf329bfe1be58743905b26ebddef27c4368f9855931a4fe2d45b +size 199058733 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..914669a739b027b8054a57e2b9439111f354bf81 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a3f1523359de1fd04963be0a8e5abd676f7934e3e6a6b4c1f6ec18bba5ad6d8 +size 199058733 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1989e2f7fa311b0bc889a78155fb412a32db7efa --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a0a71128bf3a20763ea93a315c62f46c2e47c2cfc51235e8cc93bae7ef7499b8 +size 199058733 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..aba74c6670fd0e8e8070ba8baf1a490220ea85c2 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:263bc4b0bd2b288b54032dcc94b0dcec554782a330137723c829e71d25fcfab0 +size 199058733 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c35d1bde83159f7631003cd3bc50dc76a5ac8a77 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6093db05fd0448465ce8d45fa69d6de7794b72a1984abdbfa05be2f871734a6e +size 199058733 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1ff03e62e77bdfeece6b6dc13c2352c06cfc568e --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7cf4073e57553d34f6261c8b57750b88f232f84eb52b700f527eba5cfa699863 +size 199058797 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0b37dc717d967bcc2098b173911279182869244a --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0dfd19c487290a7b3a55aa89e50edc062405af54848afe022d86e60063b4c655 +size 199058797 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b6457dd5aac1c4c2f826683bb3e6d4003b2cead1 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0321b1cbbcb96d1b886bd2737e8471f180e7174e0592995054180113a73a1c75 +size 199058669 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..49b7f263c9e43079cb0434c8c8512059d40b5519 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:69da2cc3563d1459136c5f39ffcd33b8c9c3a28d75eed375da1f717a603458f9 +size 199058669 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a2bd298a31acf5db63fe199c425281a322f7da75 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:33c9c763403367ac88b5d4ebf65d71058819715095596481c18f337900abb68e +size 199058850 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7405740ac559fface6532d1494b7be1a0f97fef5 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:685886a7ecdb481dfc217ef0fcde8f284ca8da5596da7c58cfcece26992bbbe7 +size 199058850 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..60f54ce8bce49fa7382ff57fe7cc0ef511c416ec --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9ac77596495f8c96708900c240616366b675f24aa636cc83177f9ce7ccc40dd +size 199058669 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..83b5026ce9389b60ab0b1f1d167130f0a5e7c305 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cede9ac16144e1d71f7c42a2147b6c24877a7d083f717dcb43e1bfc939c305cb +size 199058669 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..19b3a89a223c8fa78a94c00f3e7c68b8edc1ae47 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bab68026edb49b1f268a578ae499c994563b9dd885803b604fb7812eec5cce5d +size 199058797 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2564a4556809b3dbf39a56875213109cc79b9404 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:47f7cb3d4f87256f860e29f2f874b17445e52a32e5f2d2d34093d885b075fb9e +size 199058797 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..34243fe40c5308a2c107ba90955a849943fc825b --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d6065b3c475e16c302dcea56159c1083f7d19d641186c8c1bdf7052b86a7b70f +size 199058733 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a676912792701c9f1e5831a56f25291cbe714591 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:724d2c75296dcd241f3ac2a0b0adf8db88df13822ed1bb0c4aa0ccd2e878c359 +size 199058733 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..12c0ce9453b01650ce459865ac2e45be5e4b1d38 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b4f6a33d6d4b866484fe340ec80ab315b045a4c9d2fce208614f858193b0389 +size 199058733 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..50581319bb504667c452d7c3a716ba13de13d332 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8b883b70fdca5026af7cd3a4bd8fa3c44040bce28ca91acf9e5652b6df47fde +size 199058733 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c337ed3ac0e79f7ff19651d99367ddbbb4f36550 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:89ac64a21dfdfe5e7e0955fca15a446d7a903669ff3060b98f744da906e4c7fa +size 199058669 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d2a6c8630706b6c1e41d1c29fb162e68f1009b7c --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97c397658be18e70f6a1cd8f1467eed8d9c1232878ec49953bf726d0d9182740 +size 199058669 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d0c367f1cbf0b499c595b0f491106ee704f8eeb0 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0cc492f4278cb5f1236da0ccc129f5e991706d49724ce3c7cdd86b62ec12725d +size 199058925 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..da808b1c1d5045af0b9a3acce2fc3bf755372257 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e5cdbe2c481d3c7db8cf35a693a51073c246d020249103ab6c857b73594e5fd +size 199058925 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f58cf8b901754ee652bf4c3442f62e568d45d030 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d604a0002fffa95ada2659063a68a725ea54b8532f408065a95e01a5e873f4a3 +size 199058605 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ad722c7ca795a4c3a34b87e1e12f917d25ab57a5 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:159044797bec43a32471c8f128d8c7c9fb96cfa5ecaf75ca39e6daf8a057cb39 +size 199058605 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..728da0e4953e424a6f71e0d00e39c1ca9625787f --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a197cb9b59d9017a10cd9ff5194191825397517f937b19ae0f75e4382d59cbce +size 199058605 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5bb6fde90f87486e46285dbccd9c5124c7c75533 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:21d4bed433f01270c7b217449f4964d17c3b4ceb32172fcf8eb8de90c860e6a7 +size 199058605 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..50c0c26fde2c072063a5cf03512a4671b33606ed --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d67ab51aeecfee171eccdee71fd8a9e3887850f344b99e2d183925cec4ebe94 +size 199058722 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..20db59524e86ed0a0e322e4f2ab4436a9cb328fe --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:862e42d0718cdbded8ec30657295005ca23df25338a248835cb772b137acf772 +size 199058722 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c66a5c2f0e7d142d00ea5bf29c2a2cb5ed502056 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:acc3dff3b0fcf2b91b9628147b9cfbcb693ce79f28b9a36a7486e84595ee7e48 +size 199058658 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2a005b76821d34d6e4e9a29b900a290129c74ed8 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2cdc177c29206f4f0ab3b6c8452206acf09ba5ead0dbaab3e48e2bee43bad5d5 +size 199058658 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c213d3f4e0fb56d625cf94e7bda828f9436d4409 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0eccbe974e97c175052e993420140bef2697947d10b3a804e61f213f56c957d4 +size 199058722 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b0cb83d3e7ae4f374e294b92d24bca3d5aff4594 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7e8d6ffc1e93eea0caef4cbf1ded8920bd3caee90a64d4627f94406d1bfb442 +size 199058722 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..52e5163e732564e7f7cb2695165a44f1ff37fe63 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c327857bc3bea26d02a60a1a9668c622820406f5b95e287ade54b0e86349699b +size 199058658 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9c065ec4dfc35043ab60e4c506a7f72590db283b --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:968d0e956d084a2143150feda3a50eb696a124ec891428880ecf1eaa7ae38e3f +size 199058658 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f9f3bf0cc7851eb2fdc39e33496921f3322f3b81 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:292e2b2661e2804fda30a1489ab35bacff38e5376953ac431b3cd42169bb441c +size 199058786 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d46f358960b0d2144c5ff6fa6244387bf114c859 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:457e1685611c5d3f2e18b3e2607f7214326b709207e02c7d3b2c0b10789f9822 +size 199058786 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..10042040144c38a1155a9575b203374b5da0077d --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eeaacfe65762fa8e9d05a7eb4445715c03d60f34b7fd63ad3cc261cce60e7913 +size 199058658 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fd000669e210aca0ff726e38e2622a2f3ce105bf --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:126add8f7cd8be9feff1d804d68cc26661b70192d955798ad79ef34e69e66a03 +size 199058658 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..729d2121243b5c978a051fdb4566f6238edd291c --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c1710ec7a276debd15bccbf4298231511fd22d7e79b031d95549d4de29dafa5 +size 199058978 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3e48bdd123653b908bb1625580f30ff070ce26c3 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c8acf942babdc1053a2018d1d987e340274a2beac995201584494bf72dea0bf +size 199058978 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9a5eb31449c196ff4d91a96598f4c992929e56cd --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2612de77d0c213d1ab924fdd4f43a03c400e29098ad3c8cf4e67e1b88bde2eb8 +size 199058658 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..aeb87dceb3ac6a00eacb17ab67fabdc54a74962f --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:40ce15bcf3044a584bd5472b53447cad23cb8f17b9b5796261da9ee868269609 +size 199058658 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..769830a66e19877bd8ed99144312e6981b3c9040 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f65c15e3160954e7a0dff21ca5e0d4e7b7b667046d125ef92bf9be0062a34166 +size 199058647 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d164317465606b113b6890fc84ead9f1e39f0eae --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f698fa0e3a3fb55091169b00369f42587dd87f4604c60f59c91fc8f69e605b4 +size 199058647 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..156cf105fab834b2774894164e39a1e6f7605f40 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:56922e9ffe36b70796d051b61bad5ab47c29393e7f376021acb29888478e3daa +size 199058658 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b7638589a16f389cfb6157b1ed593f6e78714f2c --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:82628288db6e221d660fc226cfd8c56bae50b51f9e6609f58f0b7244fd8bdf62 +size 199058658 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..78fe6e894317176fd51b624944e0e912ed8aacef --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb4a1a16f3d1f6abce6a5c4cc82e3a8fa82eb74baec490500f861277be298a8d +size 199058722 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..72dfbdc5040628cab275fd1dd2bcf97a56f043dc --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ea2769bf960bc9f4a7162df9bd3c1c0ea86a287baf9495e18ec969ccb6ab5ee +size 199058722 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4fc38607100f38eea7828977117a93c87251eb77 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba4f1b6714a15ba9398f335a15425eddf99e8ca0b494620e975631b4a891cfd6 +size 199058658 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6fa67617fc3c318950e814cc69844116a8229857 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e73fca0f2906a4f33e5d349101392ba64e222b49513e36994bbb50bdbfaec06 +size 199058658 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b07c89bae686e24634079012cb3f104518515ac5 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7dbc0e7aea8352ccdd53cd5c982b390963bf1225877cd49fadc77116e8f6b453 +size 199058786 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d28a6786b814246034281d0ddc970fb9f6ea0a83 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b09cdb13a48129f548b3975ec07697849921c54c558a0bb889da242dc7fe4e2 +size 199058786 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..55ae8a6a60f11e8ec2107f7894e60b614cc597fc --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ec6eb9e193f58b63677e0276e7701530405d46a2c54b80d9517d56511dc1b96 +size 199058722 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4622c8dd2124a0c9f96b2d33906da49d57e7f893 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:03db2f9f1d3c1cf05042fbef608f07f59987cbd663ee6cc915a18dcff40554c3 +size 199058722 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f8f881fbcd0c00719f15a04c13114501f5e6d4e6 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c676a85c240551640b3896526bd4b2facf508607551c798a8aaf5dc0e9dcefab +size 199058850 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3ea6d66860b91f4d32f48ccf5cf8e0d863b3113c --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2fb4eddf7ab475534ca8f522ac41309739007343141fbd8d146ea4733e9e7eae +size 199058850 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5aa5a08b0ec51198a3385b2dc3826cba0e3f1cff --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1158eff916208385a30839f7bfcd3277a1a6f35cf1c546dd5d0297ddb41ccc08 +size 199058722 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c8f0ad7e96d3da4dba10aec2826078437995c2da --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:37c904dfee5c4a654753371f449b0ea66fc0ff755e6775344903e2932f7d2b77 +size 199058722 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cffaabc0a69b2a9ac860e9e28580f0332a881e40 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7557fdfae520a7adaa5dfeaa948fcf92369de6d90b116a0e1d683b48b29683cf +size 199058722 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3a4bcc0da83ac8dede052a5958508c8dcd6eaae8 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e510fbfca79378daaa0bbe81d3e499e3c463d54622fd273f34b139acbf03136d +size 199058722 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..45c6a47c375963c025494495840a077f4d54f82e --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:960a03672068af8892ee6a71cf4a33dc9b698cbd0fc962305e629495fb01736d +size 199058594 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..565e27b90f4a605f7be3183d12669a04c6f016c9 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:70d13f75439c32426db58736afebae71ae65a3b1b2f4ccee59da344ac37eb107 +size 199058594 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e40e63ed72c7ac0f0d2c3b115eebce19be53ce37 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db72171482cf79a267549aead8809e76caa7cb359fc12ee9068948f73e8f88fd +size 199058786 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9baf7916798779464efae95c8feac0e0f126505b --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0dd0f5fdbd42c638528271a377199840c1c71f921953798be348fa17121c912b +size 199058786 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..43a50e0da449b4594e32cef9fd2df7ec6e889ce2 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46a36f0a8821448f660c1f0e607e3d62a9ca191e369d6d453fdf511ef9544b87 +size 199058711 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..54b98b12887a662a8ca380e0bd9736c3cc6272eb --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2acb31779845c922c6343df4b14a1a957d69f3e3a941c0fe2af21fe7af435991 +size 199058711 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f019bf682c747f7c923af41a74038fe9faf2c77d --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d8624c04229a4f2992af501a320d76fb7c60a4cdcf8fc131a18c662bd7e5a41a +size 199058722 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d9e29e2721b7d22ea0f6d91c1e2534005e1e8381 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:784746dac7c25e17e4570a28ee0e1fdea2397f3a7f27ae07a4c2bd93b9bff90c +size 199058722 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5f10395422a8618c14c5463b2362a3e2305a9cc0 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b2251c9da4c825e41113abce96b7cf5694e7c90210d9730248865d707a6722dc +size 199058722 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6807b1619ff7e829030771ae1e1aa634f0562fc8 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f255344604749b2ca3f7cfb605737b9574f9eefdab1142a2ab3d7262bdba740 +size 199058722 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c94b9607fb77e08a0eb07369d9b81d4c12465f66 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd69dc5524d9974f59d22a3cfe9d3bf6b72db424d4c7d2f318a317e3eeac1191 +size 199058722 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c37c9a457516d77b9c899548bf2136c8715d7ac9 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7762a80123173c483433dc0915b2a45f09f47e2d75751fa99974a78961779cbc +size 199058722 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e7ecee6d1998497921ae4bb2957774d64b556cad --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:057d4def3306a18ded1501ab0fffdea280fb09f936798b54a111de734d279eea +size 199058722 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a9be819bdded6de766c909f7805c6c132da9bf90 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f629b8010270e69b831acbcde74960674d57868ba32240fae1ae1a997a44a544 +size 199058722 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..77a78d7780f75e1693c25a447261eb408c4a7544 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a82b386ffe973057cc886307244f675ac18aeb7dceec9e65e9b9869df3f4c540 +size 199058722 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3c83077b05f0d49a57fd1418e5607ce4823810f6 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b33f80fe1df49a10a8a38bb3fd7d078effc50aace734945e6464901b526a267 +size 199058722 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0dcaf0ce7c01e8def52ff9f6ab9e2f60dd3e6b89 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c69259c00d506ce917487d109dabe3708bf79a4376ab94b94f7ad121a7fe403 +size 199058594 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e2fa6e032bfd7fed544f58150ce8621e8d9785c2 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:080ebe5cf4b5bbb8c2f18d4ab1b914a5d48cc0f045834ba4a0e77d4e81f47c02 +size 199058594 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..00b99e0dc254a2a12883d9ca91f304f7a3677d85 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:56855a9785b8caef80ddf5deb1332c6e6f86378da8c391b2a4b5ae10bc655087 +size 199058722 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0c8db868783208db8f6b0718ca6bddbd2fd447db --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc3ca9189d8b2c246a2773114b5eb47e16a4d5be7f39c6d62b69850204939ad0 +size 199058722 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bd2718052c2a8ea0754844599071188df2202d76 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:efe3e0e42dc1340f9cf9c947421cbd92c3e239820ed875c9106b16463026f75e +size 199058786 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bc865082d81a3bbb068188388b0852f33bfc77e1 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b5cabe44c88241f1bd236b3eb545737762ce76ad08862616197178ffd9b5b61b +size 199058786 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e3476ecac5184fbe8775748aff5fe621373d09fe --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d76aec01e1fb4ca73feaecaae60e21ccd70cb1d4b638f0eace3beeb0076652d +size 199058850 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ff24dbc387bfa189f5278d32edbfa7e72618dbfd --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d5ece5cfc6153acb066d06f4385cd9be264fe9a34bf7bd1ddbf94e6536adf524 +size 199058850 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8dcfade1804ce653465b72951435f7acaba5004a --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3ccf341bc8f47de6befd2912eed83f79908f8168b0b9a863944df0c5ba99e1a +size 199058658 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..42efff5d6a1bf4f1ba0aa7696f6955741f83e969 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8bae77452a968049e521ba2a4c0123ee8884c21b8a79147387ef39976df5728f +size 199058658 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a062120ae2be29fe3738d9d39fde9e597cac1656 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad04217caf59ce11433cc7a227e10addc2b3e4f02a90a56f291dd6004c0b9392 +size 199058647 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..49726acb398c7176f20c5e128586c6d51b2939bc --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b624506a07c0ae19f5ed92a7e3acba144e97071b45e8c2b5079ddadf132a3aff +size 199058647 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e5d91306305c6ce3ee400223d7c2f9311d4ee57d --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e5c269b6cf0ed33827e049dfccad3edf668ef70e5dfcd0d292dc1148204bcce +size 199058722 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a90e3278ab4ceabc9be44874dc1a02127c4dc886 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:07206e975c299c7404347e3375e3d48b5bb5f570680cbf2f03f8b3a0acec82cd +size 199058722 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..94ceb260822a57cfcd3c458ed85f8def2a545c92 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b71edb50ddf2ebeba8d14fa098e6d264e8e9cc01e0f50a69adfdff9d9a09f913 +size 199058658 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c2c70c056344a249e82532b1ae73652a54f983e8 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a48653c248e6e3515cd75a4c17d83b10ce31be2e9d274229a8fc4f27ad38b46 +size 199058658 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..28f89a6bc71b38e03f8a27616f17cc180fced379 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0bf309bc17507a495f47dec6dbac5aef6577b494aa4f5fdcf60854c0c0d4190f +size 199058658 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bc7fe0c096d4e798a792c9a1042fe85ec7345ef2 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a235f0ca1da869aab24bd0059498564f0ca5240a011d5303e824d985d2c38f56 +size 199058658 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bb090f96b7899e25eef1bcfae3cdca2bdea69982 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e83ed1ac8815dc4ef0a24ceb4ecb5a3046dd45bac1684936752f2689412e81b9 +size 199058722 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..96013452b380af0c860d45513a5af035cdec8710 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b788e76f46693f397522026f36cd299092167100aefbf812a247b016527235d6 +size 199058722 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bd9426236f93394bc803f744232e720b75568a75 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa164b456e2959ca4b10207a171a671f92503bb379d3fc65d894d1587fe2a88a +size 199058850 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fcc459ca6df0a71e2e90638fa9dff7862c6fd895 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:17f576ff91826f20c7993b97c0247e7911a50ef282b94497f5efa092c2d120d4 +size 199058850 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6298d30108dd2f43d2eb5a35ff9e8586734b09a6 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b40c921713020b7a46265c5db2a6aa5430c63692122b914e05151a3f8026482f +size 199058722 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5c7d43bef03e13d00525f3f8bec4d1a11ac63b39 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2598cc2cba34ad0a2c376da1a8a65bb6805e6b0a6ee341c5ce82a1da61da7c75 +size 199058722 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4b2988b2da9e427fd6e83bae3e42442348d8616d --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:18da42d4d0691bc76f9266ea517d5fb7fd5d43a1db1179cb50a16e353d98b448 +size 199058658 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..311de1857c207a55941f74a3bfb1709bd8bdc2fa --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7ab6abe3530498199f3ff5db6839b5288ba0257903742630e0d66827d9e7337 +size 199058658 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..02f53f4c2226f2a1f46a0e105758a0b19ced6ce5 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:19155d506fd18c51114e364ccc8401df77527720e48c218a832b740a0be80c12 +size 199058722 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..77d31eff8c683d13dd16a0e40461614bf04bcfac --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b695d7bc1bbe00267daf16800cc7c46188140e1fbee93ffa7bee56cecd438ed +size 199058722 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0ad3541c15c10b645bd0cc5d2e6289ac66da49c8 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6762669fc98e327a427b420fc7f694acc65ff6b34f371b17c5ed73192da7c740 +size 199058658 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6f6ba35c979d249292297c099c1b0140183f16fa --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3bd87428efaf52f877b1bb591308a988c22a04aa99080f990e813cb01e951bb8 +size 199058658 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e84b90062f55529f4abdcf69be2ad5c013aa3e0e --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9c1f7e0220caf63f2209b8b9e671d2a574066ab3ee9c0f85019589f43f8b550 +size 199058658 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4c5d41fcb180ada6ea115daa9b7a382516610580 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b4a1b76d1acc8fdcce0cc32a867d1e117324e91a5d1127222f5973da385e335 +size 199058658 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..74a0181cc0f8f0c800042c7e20a38ee9983f3cfc --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:67880ed4bff45140e41a25d1d5c8b172936102d4861762a996a3d1b90dadf453 +size 199058775 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e3049d6dc0c0867a5db3a3aa3b0a6850182473a5 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e99b8e32095f357548d4727f253c67640c9f2ff6034002b8f9554a70c86ec6f +size 199058775 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2a12e3b75b51aa312a97c5e8be91643423c4480f --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:836e74e93cbf8d4134ccc9c312d1532f1fafb31bf5dc8d208acf8017eee9b2f3 +size 199058722 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2be9fd6e22900cc0e25a48cfa5244b0531e09aa0 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ec5e0660589bc52ce985c5ad210d0162461671c66ca9cb3c3d51240741f8e20 +size 199058722 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..781055b265284ce145049fb739154ee27d5c95b6 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:91f337abfcbcfda74f752bba6b2a96de012611f128db99aa021a5661224a6859 +size 199058850 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ed1f09fda51fd25390aa17621fcc04013c6755ac --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f95ec61a072a69d1160f34e3dcc4790697b0119d1f5940fa32a04356468bb9f +size 199058850 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..571c418ceaeb8ac60ea5df203af541f7d0261db6 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:57c4d99c098e0f67c661161d42e99ca51446b967e8eba21ec000fb788d9edbed +size 199058722 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f4368899d18b7c6eff039e3ed16fb97f3c9143c7 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e36effc2f1bde4a648dadf32e6edf5ad92b932cad5a71c4fb602ca0a9ae8e74 +size 199058722 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b340a5ab5e5984c1f0374671715142b8de0f6b4f --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af3094ee36e56fc277897dd4bf7b629bef57380dc0e7086c361428898a174b4e +size 199058722 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0ecb3ac5245c0d730412f2433d1081016ff7d75c --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d6ce5e1e997de03f2332328223d0f3f1f65504d96b28cfc9213640266cf91dde +size 199058722 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..df3e3ab3d123d936dde79770255da781000042f0 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:03b838176d28f3d53bb4d6f964b75848820609d080990efc0f5f99fa056fbd69 +size 199058722 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..64085f1818e50ca6ceb232d14d999d0875baeb0b --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aed783e80d34fc61ce991bcf592c062da741e46239a0717bdb292255a2aa9a1c +size 199058722 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8f2f034388659e7e1d4fe88824db36329b3b6108 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8fe34da3fa3a849a21cfc61d368d8cf57b398416760df7ccbaf0133ac9f14b34 +size 199058658 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..701d07c9716037a7a6e698d9434d83e5d0a20852 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e209dc9ec73983a65ff38e877ff66a8dfa5bfbdbcb27cf3b527ca90f41aba55 +size 199058658 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4477ec22e764e105a49161d5edded7471c926fc9 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eebf0732687e38873fbbea2be9c0741ce18c47290b6276752d151fd607b1f46d +size 199058722 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ff48409e1824622593b5170bb4e2bb4aa3ef1cfc --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0fa3fa1c7a80c92d0fcd5b2df6152a75ec565ab79b8e63a2de1ebda1a9d7c739 +size 199058722 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8847c69c2a4517640abb6978203039eb64168df8 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd8360e9007d107de3d82aa0e8f8383669eb07c63756c0a955c93848a6e6ef4d +size 199058658 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e37ab94fc3d6e8c8236a5692c156729de03c529a --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:94f4f95b40373b8ab0396fce1daf849414cd79620cc871549bfb606ae27bead2 +size 199058658 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..30d9cc970db9ec28933eef6835e373931068c615 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:49b7588732fb608b97dd0ddf9803a06a1e3444b323c4d5ab41422234fdaa12fb +size 199058914 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..18ce7c4cf2a9b8abfd128cb47b17f3da8a4ce4c1 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84263595aa1ab6e110d7c264aa9d22c9616083214e55d540047b372bdc3d0c27 +size 199058914 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b87db6de4c045ba3433dae4a8ef52ce9ebd1590f --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:200728ac277db082ae3761fbfeec775b8a1eca59bc0cc1a4d878f9f1bbfe443d +size 199058658 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b24d759cba07b2a920e9e7a83bce73491539e842 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6bb47d479b4dc981ad3e439e3db4740ccfca003a02024bf941bfa73b0234784c +size 199058658 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..91fc3d9c910423e3d7d9c2d3a5ccc491e4a8e476 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:15a2d47fe27fd07c9a2bdcc1d8c76ff13ff4e1a3abfa34b1e9ae39bd4c1db5c9 +size 199058711 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..942df69257dd3ff6ef979416c08ef15a6dbd1ac3 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e756e1681a34d97fd9403a8456deb2abd54ac0c728e422bc9dd99778885082eb +size 199058711 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0d457bbe78ac533bbfacb153beb9a29c2ee09d67 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08c8f228933d373864179df81abf7bb12e655d154757d488b25b5b3c927f6e9f +size 199058722 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..48ed3d43748ce087aba2830c03d56ec370c5025d --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f64e4d42f2c884bb4928e11dee6fdc18f0eca1f57f33e68ff6f7de74088f9538 +size 199058722 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..83a0c433ed19e3f36eaf0be19599cf2c9f48f67d --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:876e19e104d971f3360d32e7cc14fd6eaa1263b47954965d8efede3e853852ee +size 199058722 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..924dfd46140f2c514308b6d30f72371654124c2e --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b146a626095864d5da76a91664e774053d0ec93474777e6a1a9a80c9a036728f +size 199058722 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..838106286338f1f0af93605510c56f22e081bb7e --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:88cec3cbbe0ddfcae2981a09a4c614df5b053733e8cab0f463dc4c86c24ef004 +size 199058722 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dcbb05e9545fa30ffda4e8d265c277dc18230066 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:794633578d2cee2ee08cbfa277ea7bb1d13453fac57de597db0f1326b1eeb6c6 +size 199058722 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4a4c879995c94b38ed201dfc69d4106592ba27cb --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:757c49f751385d1f55b13a69ee5c26fdb497078408601ac1c679ea55cfa3c006 +size 199058658 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..272cb03b83c10d7e5d46acde3c743fa25227d7bd --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e50d795dc17521bf71b0521e596dfe99c8d51374ecbf70ff5f796bfda1fc401 +size 199058658 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4ad14e2d1868c87212623025a5a6d4d56c83dac4 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f426519ea88cbe22232e01522ef560ded24708cdad62a1c3c597804b9ef8a38a +size 199058658 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1c1bd769b9970dbbc60c57ec7131d9687e2b726a --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d59a357420705f0c132712da71807b3eaf9da896c7db36d78d95205abc95482c +size 199058658 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6853b53faea2f47e1e96d1cc4e89bcb5070851d1 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aeaff5aab5f057848595c4b1dc96c9ba46b27decd983b3e47733ee159e6b0813 +size 199058850 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3796edba2aacd8e9190beca0b2904e73c96f016b --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c899b43a133c8ead27118ffb40ce072a4c757f6c15cbc252cd32a7499b419bf +size 199058850 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9bda075c5b443d4a0c460eb2cc5379708c3624ac --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9fa22a04b4d3a28b7a395f1ad36dd2609706628ed60cd353d6d3f8da4d479f44 +size 199058722 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..108e8d92060a47a4688487e04a17f3a8f4ecc389 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff76705a57a2ab8d1b3aa1ca53939089f91296b9b705d27a02822299c0c16b4b +size 199058722 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..73870a361305b85223d7ff477efeb16470dcd1e5 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de13a714354e4dc6d8dad991d758c10780967cb1fce406122832e9e268b151e2 +size 199058786 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a8641e8bb0d2bb731e324f3440b2a4b5c50f950f --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8eebaafc0ea951ef84671b80e271f475efcfb246c53a85e2ac35aa486239e048 +size 199058786 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ea4cd244451037807a94aaccabfe0d18bf41677f --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f46c971343b04914b04f7f544dca0d627a534bc4f8189aa8dd700d3ac592f2d +size 199058658 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e2414cfb9843c96e7dc6f753b1d87b0f5b823fb5 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fdcbc30bc1c69e114a849eecf3e6c56e4db13360b708ab324ecee002dd92d14f +size 199058658 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d4c6599b783e1c9bc4dda9b4ca2a6b866ac4a680 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0fca92f0c7f06aa6063aabba5a626827f66f239167fc2bc0873191f4f01af36e +size 199058722 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9729f107e24621f55b98f7453871b5fd031800c9 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a6048b032537ea0438536f13590a9fcb7bdcd20d95b5912331854fcf64e7a912 +size 199058722 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..40dec6a9c7bb372397c64f71104afb3cb4b93879 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7082ddabe8f2006e8ee119054945c7a9808e3a83c7b9a4bba6a03c6b8ee0f46b +size 199058647 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..03d8366eda459c679de43fdeee368e8875333b18 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f95a7c21a5cc701e1081a9c896c69a1a94c16239724df7dc235766dcafbd6f2d +size 199058647 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b2be10a686763fee33b26e20ca23bbba0e3fca99 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39d92948f973e4a6ed898c55c962e7235cef38bc4b69958672bb92342c406c78 +size 199058658 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2941c05e62d935f455791de2e90a571b84d13dbb --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:edcb5a0e7eeb03148d191bab7c8372709731918fb1e5fd252d08a1553574561b +size 199058658 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..761e8615a6c97f46d31600a7c82c17b5aa54f8f8 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a05f88f24e909620767dd4b1c51cdfa712b4fc12435ecfb9ab9c711180d69fbe +size 199058722 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dd84d9dfbe6baeb83fb2bb24994e8bb10e441420 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:04140bf6eb12eadec3aa515439fc6cceb69ac7d609412ab78d31306e3b64d09f +size 199058722 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d75ed6dfcdfd7990ef2c85ca375626eec6ff3996 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d3e500f3b8666ab6c5d52476998ae287eabe2e341f47f1602f44051690e9440 +size 199058786 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bfe665fb1b30627ecb39c3437059e4704200059f --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8cbd3fa5cf401a7493fe2731bf6ea174c3a4805d7a6bacafecc857a1761e4f5c +size 199058786 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9847594126ac17b86829ac30d63aa4378f3410be --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84b42c6a9da981d5686242e8d748b2337a05b01ebce6357e03e8c08aac1f6f0a +size 199058722 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..be63b60e925a1d0bd3f6045888a28aacfb4e72a2 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7254c6c53ded80cc34c21c3b05a5bbebb18b1ac265d3b93bd7d5f87c0f09e688 +size 199058722 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..22a9edb330da334dc3f49a23b4ec98ac0512e045 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f117dd4f7bbfd2280b787cbe608883113beefb5af1d8d583312d8e71de9f4fd6 +size 199058786 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..41b7ac55272a4a8e631a6dacfe8c6ad00997151a --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d4223b5be3f44ec7a0800df642748aedaea06299db7a050276ff6f85feaa287 +size 199058786 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b927290896364001107c7fbe0892efed76400c19 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc020cce1bdfdb7dc282ffafde41a33657594894b46cf92ccc10cc7a911a5c3b +size 199058658 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..31e70c10556d1d80bd909a55e3d9e26a45b2bd3e --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:88ea29d14ed17c1ac645f36732a60d6685c351dab64d41866ec035cbc3d47d20 +size 199058658 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2deefa27b5dfe517b3db0a77cc3e40978d5511af --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a3364d2eaf49227c575fe4cc5e9cd300ecb425fe8c742255e74900a2fef95f3 +size 199058786 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3aaff968493e8361730ad3822f386d736f59acfe --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e162aba4d3ef4a8d6107ac988367382934508ff6039dabae2452c83d969fed97 +size 199058786 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a9ca9c72a4ab68053fb0a44cd6277f8f6f25fca1 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d492da8c8e3b9a473b390d6ca08cd60d1a127b9c14671d33b7c6e21d9d153b4 +size 199058658 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..61850b0c7993c98a79d77ad7857c7669a3982150 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b5105200af5c5daade5fd561a94f0139977a589f890f5bf67c03731cb3eb74c +size 199058658 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6d0d4b4e921e641762e04699dc8e0765c0c13399 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:89ccba039d70f3c496b1672557b75b0281e2f786590f7662f7c803c2e8bccbd9 +size 199058786 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..51d9646ddc627bf685679df1740aa19be3849952 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da2ac6e69ae497c5bfbf8a31607daee0a38f05a446df125f13688240fca080a5 +size 199058786 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d4c16b0f603e8f85f14ac067126d3bc5e790cd28 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:acc31795fbf44be9cb68017c2ebe3544891ec8e0a24c082697269d332bd9dce5 +size 199058786 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8184f9f585012019951791f668e69d2f18e6fed4 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa29ff43c1e3001ab23c9cc0c93e52957175479b989944c3c5684ad148ed42ca +size 199058786 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2c74d25e46d5ccac5fd1db3ec8db1374b2ffb19a --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:78f9fed6e469d98124b90046fd0110886530b58fd697eec7900d2c56e4422758 +size 199058647 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c5b5c7d706b6456b4e187036b7f93670a3c75998 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e47409f8a1c2848a230c6cd10bfd9b14c52b7c6d8e4a219004215dcd28077ff +size 199058647 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..22f8c7406098cd63c2a7f94c5bd5da7cad96813c --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c1a2132eaf68049ccd3ac0103f4cb142f5f4c5b14fc6ce9bc035880121572e9 +size 199058722 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..29474a75c92e3df75fcea0714a4f3597a9ef80ce --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7516c7512add4ee77cc39bb0f86a6f357a070fe79591c61d6680f425c937f7f2 +size 199058722 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b3264da4d88d2907007ea3bffb94e5a3adbf5b61 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e92b2d227644e98fccb1275b0f9d1957e9e41ce61b84fb98e5f656dc14c41c5 +size 199058722 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..900face4fb647a79e269b92af47f5b6250f626bb --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1bcc1920a7666c42cbe8e07cdc950f87ddf92e4a3aaa9688cf8d6df942b8b358 +size 199058722 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c0396c5f8a7d134cda23d92fb78f8d9ad7682aab --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:146521184631f36e88de82f9fc3d9dd7aec32c15d4410910bf8af04a6dfba63c +size 199058658 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4a2daf27ad5782fe545b24db506df431a06b8bec --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6a4296d8934ebd6cf6bac0e9b16e9d7f0afa2871e911f796e23cd4248c38ea52 +size 199058658 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9a2468ff3f84a443c8a3b290e5e80f05670520d9 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db2c0f032a96d36e5b9e8b60fc31505e538d8d072d0130ffef707125e1fb3630 +size 199058786 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..38ff000fe40ed0a46ae98aa866edf48c1c7b7ba2 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b892b7f1e74624b4488f21823b0948a4a1f58e89d0e7551b30edb18c2ba1d21 +size 199058786 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..aaf8151d19e93c5e6599ab515d19d9b766d73b42 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:703469381ecbedfd0244d57a6d66b92e3a8ecfab233c199d394c0d77a5c6b335 +size 199058658 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..07be0f1a1082675740324ae4d8f675410a8125cd --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08a89a46a4380ac0f6612d69ec9c9b75615149729375da1309b8de367e76abcc +size 199058658 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..56135fd9df3dc2698fb054c18485036e0a565ca9 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:868cc53aac45008ec41df17e82c548d746ab12c200e70461265ed534ee15f88e +size 199058786 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..894261683c4a42bc2d74b91df8989558587a550f --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f0f7ecc53840c00562576a850eb40fd116f7cba4e8525b8cd445f77c6ac1874 +size 199058786 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d3d850f450bdf68235c72022608a71efff8a9239 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2df832299eec2c6182ed44368e2097e3278c2533f4d63310de345c524d68799e +size 199058786 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d9f3efc84233ded1fe09ab71e6d66ad18145ea93 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a7e9667420237518936b878e0b4f4a61fee3f19f2802513d8c18f71610ec109 +size 199058786 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a7fe61ca569f140259e74d15a0731c140a6a029f --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c8f38e4773a7634520a6715c18c29a74d235e2e9a66036d3e57662b8edaa96b +size 199058722 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..75e128fec0c00509b16854ee8611db550517a7da --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f53a0757f87b397e1df89b233212382caa6379bc42bdeaa8d656d4c9df73b065 +size 199058722 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6feaa0dd476881c7985a2be0f680b7d8c320c372 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c9c37692578b9bb1f2ff571b024a67e41f11cc5feb6f7472fcd01c5e8742746 +size 199058658 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..14de066583f18015233ed1cd7018eeceb8c35fc1 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca72d2598929461ad5d86013efc5998e90c96aecb11168cdff5a8d15ee3daa36 +size 199058658 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c552a2c033457ed6d550f516e255ce4742c04b22 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ff1a1a5d25f4fb913430c698ba721f3b14d5f545089cf979ab2f079f661dbf2 +size 199058658 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..afbd66c9c7ba94c08a900fba5e5b1676c34a4e47 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:98e24ca013abecf8af2ffaeecc82d5f04b941755ea3859d61449c3e79cd88b85 +size 199058658 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ef4b09474d8632860b9a2bb05dd778a86866ae3c --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d71b235dd6530f25419f1149d8142d10ee3fb05cf3d96d022dd74603304527f +size 199058647 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..111851cf88ff01a138a739e5d429a1564557cea5 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:29c1506c1a48d56be2e5542f460b603f6086b4a651a34fbae2876151e4c28baf +size 199058647 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..37c1749ec30f9afb858e7dc62ad1435549b19c1f --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b10d4ea229120d4fe287105921a4d3343a4e6f52dfe4bd5f338e5c0cb7c048e1 +size 199058850 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..33064c76fe319a4d5cd9bad40988e1b0fedd7775 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6579c87eb49398d7f8764c0419214d82075bc3e23522eca8e83f830f5ee808db +size 199058850 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..446c421139acdaca22b887b482523359d57938bf --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1bbe2bd4bf4346fecfd5c76cd024a5422f553d90ffc594d27c8f0a2f13eaea74 +size 199058722 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..002360a42ded1c41149cccf6c0c89bb9b92c36e2 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f1e13c3ae42f0f4fa3a05bd20f16cad4c24c6be100d2026ffae0f0d8c77590d +size 199058722 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a527ef2ebfd6dd43dc598f73af672d144808f3a1 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e1f42e6b435babf53ff3a8115f0cc5022f80ac0699fdd6f4ff29ebeb55bca7f7 +size 199058658 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e82bfe3e078926821ebec4f12572fc771bddd5db --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a9082fd4e148e4bd0e00064514f5b9b664d9736441eaeec35f326316ff7f095 +size 199058658 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5e4a6dde9aa05a5fa28cab452a46cf895d99c045 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c356f2313284588a1cc5c9e1601045e47a6b106216778e66f23caf4bdaacbb66 +size 199058786 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..05e8f1978d91372e7b0adf0aebc9ddc8c36e5d1b --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10dc3e2436331e83a26263be6a847bded7efdfa1f309689e78fc0455036e5e70 +size 199058786 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e3820e80997af9e0d8522cb28585a8cf7d432fba --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0988781ff07090a5a20e9a51f91a2e78eb8b963ee887b78d02255c5a4efa22c2 +size 199058722 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f51a69eaf7c6319a9431842ae498d70ccd6f49eb --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:735920eb93a385f9fd2166d8907c1d781fa15c1d943d158754e012a34380e03c +size 199058722 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bd5dc6a1ed2666b9591dbd3c8eae807e4ec8e197 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a95be81073268370f808f32abde2e500485c2ce02ab8cfdd6dd6acd7138baeb +size 199058722 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6ac52dd02a41f9c43495d3d3da3d55fb78e634c5 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ac8d4e7e853bffa2e13489e8450d75fc7a2a742cfc3ebcf07ed5de230809b72 +size 199058722 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d5f5752b2b16839a0ea4e8fbb31579537559d331 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:055280b1a91c1bd4bf10a090ef1dc17268e18d41f0c8ea29054e52dbf9e9dd68 +size 199058722 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4894013dc396d04f673d30a45eeec03ba350b9c6 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f810dadec3b390f48b5883333ff1d1c32c7caeea8c6da735d5e47899be031bd +size 199058722 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..90bfd1454b68e5d4d4bd9e25ed1f357817b355ae --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:edd680250cb9395f471d7e9e986e9401e5416b7f7730555bd5c48406ec55dcf7 +size 199058786 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b73a5bf95993d323cf3c4c59350ff0afd7de8472 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3228e8cfd8e49061e31ff1aa78e25b5d9dae8063cb4ea051f52f74abafbf30af +size 199058786 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2e939ae53216b14b1f45d92ec18506255957832a --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d95de6aad7ab23d911fcd971d6291523fa4e8496f8183f5354388a2aee2a461 +size 199058658 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f7109ef5a7007c4f168ec918f79e9996ddcf59f0 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:322db3d0b00c25d8cd25c6d5a24dc1818746031a3b0d736e2630cb859dd2ef97 +size 199058658 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9219214d0b18ee245b77358664df438935d7302d --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f5944db6404dfeb539f2e0778ee4364fb46da7b52b563b2c53f4518733873018 +size 199058658 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..522f2f3577094bbe0c2976ac2652f02a42e15c4d --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:247a1106c0c16578862e15974049d0398a56a689804c59ecd9c82d367cad8f95 +size 199058658 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3d1e5b36ed16d408e1b66b8da55b53589641a9d3 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:506f770a8a352b8cb9691928147d86bac82e07a8b4ea903c3043a3de25d6de36 +size 199058839 diff --git a/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..badfc577aef91dcf1b02103f41a2807f3af866fd --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a33b02ff40dbc6b5d8b85f554f09b17a44c3e13e04e099394c1eb58f39fc13c +size 199058839 diff --git a/4b284b21bc4seed3/global_step80108/layer_01-model_00-model_states.pt b/4b284b21bc4seed3/global_step80108/layer_01-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e7e779b2cbddf19fa873ea4576d70f6a641b4004 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/layer_01-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3df9521a2db7792c702055204f10111f0a06822baee0b27782d33ec7cbd19ecf +size 167511299 diff --git a/4b284b21bc4seed3/global_step80108/layer_01-model_01-model_states.pt b/4b284b21bc4seed3/global_step80108/layer_01-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..880d30cdcf4f1f034d5b875f0bdcd5876e0ceb5d --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/layer_01-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aabd992251f48e67ea74a7fb8fa5ff5cbe77699184d15c425810ad0cc092ece2 +size 167511299 diff --git a/4b284b21bc4seed3/global_step80108/layer_03-model_00-model_states.pt b/4b284b21bc4seed3/global_step80108/layer_03-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..048728e3361df22699a452c16124b4c95bc26ea0 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/layer_03-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d780183d42cb40077cba73173bbef764bca9cfc80136090b3ffe20b7cad512a4 +size 113308931 diff --git a/4b284b21bc4seed3/global_step80108/layer_03-model_01-model_states.pt b/4b284b21bc4seed3/global_step80108/layer_03-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b21552fac158bf6ad6edd90d862ffccb58f89704 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/layer_03-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:95bc484a054826647b4585ed501fed472da643fdc5f184c2fc12d615f0f7e0d4 +size 113308931 diff --git a/4b284b21bc4seed3/global_step80108/layer_04-model_00-model_states.pt b/4b284b21bc4seed3/global_step80108/layer_04-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2cd002d248348e089f0524feb230eab20e280fd1 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/layer_04-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:025688ecad3e6e067bf756ae8a2ec74ca0462663497f1b8877b7ddec4ee745ce +size 113308931 diff --git a/4b284b21bc4seed3/global_step80108/layer_04-model_01-model_states.pt b/4b284b21bc4seed3/global_step80108/layer_04-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1cdd0d65ac69c2878f1beb0e3371d3d45720551f --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/layer_04-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8503a5f1f3e2fc2b9119fd0c72d8371914310b6117a193f254137e0faf48ec8 +size 113308931 diff --git a/4b284b21bc4seed3/global_step80108/layer_05-model_00-model_states.pt b/4b284b21bc4seed3/global_step80108/layer_05-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0879c247ec2d497a0bb682525677aa1287bb4212 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/layer_05-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:48f03206f4456952f1f7843ec8394c8c10a0e88d16651bcb585d51178c4d4830 +size 113308931 diff --git a/4b284b21bc4seed3/global_step80108/layer_05-model_01-model_states.pt b/4b284b21bc4seed3/global_step80108/layer_05-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e693d8fa5ac2940bb087734e0113a12a0541056c --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/layer_05-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b435183738c821e47534749aee627901bf2ea5b4b47eed6669e5331139a86b58 +size 113308931 diff --git a/4b284b21bc4seed3/global_step80108/layer_06-model_00-model_states.pt b/4b284b21bc4seed3/global_step80108/layer_06-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8dc4469e9601615eb17021989be8cd5b043c2b8d --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/layer_06-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:14f053d8c592b3ad89e57406dfd3f5df544df38748144c8d3ee867cd8e821d11 +size 113308931 diff --git a/4b284b21bc4seed3/global_step80108/layer_06-model_01-model_states.pt b/4b284b21bc4seed3/global_step80108/layer_06-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7f7345e8d6db251280c14abd428ec21b1f976d19 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/layer_06-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:142c0db985a3006311329145db1291173a3da5162fd4eccd00215fd68fb9b482 +size 113308931 diff --git a/4b284b21bc4seed3/global_step80108/layer_07-model_00-model_states.pt b/4b284b21bc4seed3/global_step80108/layer_07-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9b16465e119ca5dc5bed4262856d421ae10c0a11 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/layer_07-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f7d8c202762ccdc0ca9dcb0fb38e9bef25b96be1c4a33524f9359d8d16ff3b5 +size 113308931 diff --git a/4b284b21bc4seed3/global_step80108/layer_07-model_01-model_states.pt b/4b284b21bc4seed3/global_step80108/layer_07-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9c38900a74c91035c50f069098bcb7a7c8714912 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/layer_07-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0bbf817736a99c547746ca97b654ef3395645b86b8018b9d1b7afc0cedb3f647 +size 113308931 diff --git a/4b284b21bc4seed3/global_step80108/layer_08-model_00-model_states.pt b/4b284b21bc4seed3/global_step80108/layer_08-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e2f6deb3dc937981ee255bda1b113c7d6939db96 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/layer_08-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7246b4f5150a885b2f6b88c2b7b3c697b2ab1bbbcab7e7567fe84d95902fb608 +size 113308931 diff --git a/4b284b21bc4seed3/global_step80108/layer_08-model_01-model_states.pt b/4b284b21bc4seed3/global_step80108/layer_08-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f70cb9dba56cd55a11eadfc70e0d67468a7e04f8 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/layer_08-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22e234bdf6bb2036b9faead1bbc3791524bdc5157a202223415b62ebefab0166 +size 113308931 diff --git a/4b284b21bc4seed3/global_step80108/layer_09-model_00-model_states.pt b/4b284b21bc4seed3/global_step80108/layer_09-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a2070152166afb8cc5b885a8c95580a866b75c72 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/layer_09-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a092d5ed2c04d6d85c3f897ad55aa3c7ecb199845b20c6808fc1e00ef2401381 +size 113308931 diff --git a/4b284b21bc4seed3/global_step80108/layer_09-model_01-model_states.pt b/4b284b21bc4seed3/global_step80108/layer_09-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..854dd224c8d5b97cc6ff89868a76b913ddc67766 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/layer_09-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6a2f7e848814f3a3cbecf80c4b5bed0e2eb39a144d697a775ee9a911796b98cf +size 113308931 diff --git a/4b284b21bc4seed3/global_step80108/layer_10-model_00-model_states.pt b/4b284b21bc4seed3/global_step80108/layer_10-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4c978d3f47a1a77d70a02a7852a6887286f329b9 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/layer_10-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d7c194c32c7e4484cc2ab8d0d2bbf7d2f742b08c61d602817a2b4beea223b88e +size 113308931 diff --git a/4b284b21bc4seed3/global_step80108/layer_10-model_01-model_states.pt b/4b284b21bc4seed3/global_step80108/layer_10-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b35d9b4b1010dd3eb4ba2236b2def595c57325c3 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/layer_10-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a4443d925ff4310446d21af1f852d90bb62f6efdfdf7aaa6ef47cef196c7998 +size 113308931 diff --git a/4b284b21bc4seed3/global_step80108/layer_11-model_00-model_states.pt b/4b284b21bc4seed3/global_step80108/layer_11-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..59e0e9fef6f593940cfeaaab8b7537fa027b6fdf --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/layer_11-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f4b44df1a08411d9462b3f15d76f8c6497eaf99f642bb95c19402d9bbe03aa1c +size 113308931 diff --git a/4b284b21bc4seed3/global_step80108/layer_11-model_01-model_states.pt b/4b284b21bc4seed3/global_step80108/layer_11-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..738b12fbe812ee2899263a0ad70de8aae8004ac7 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/layer_11-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:26041bd5afe0a8101aaf7c411864ff0288d2f2b6091682d181ed2bbd66a0ee13 +size 113308931 diff --git a/4b284b21bc4seed3/global_step80108/layer_12-model_00-model_states.pt b/4b284b21bc4seed3/global_step80108/layer_12-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..483a94268f22b4b4ddfd4fe6a127c653b14d3f86 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/layer_12-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f6395445a09ca2e455486f0081f800adeb2b7da3527b6ec53ee5a7d62971e4ad +size 113308931 diff --git a/4b284b21bc4seed3/global_step80108/layer_12-model_01-model_states.pt b/4b284b21bc4seed3/global_step80108/layer_12-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dda45a2f7230a75160953d6575c0431fabd4066f --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/layer_12-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f00b28085a4e2d8b9f69cfe99d155c9b1b200a30ed525a630c06876e91e3bddb +size 113308931 diff --git a/4b284b21bc4seed3/global_step80108/layer_13-model_00-model_states.pt b/4b284b21bc4seed3/global_step80108/layer_13-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..909e374511339df6728829e9d1d189ed2c802071 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/layer_13-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:937d091dae4db7775609ce8fcf07cdc89bbc109cc196abb8eb9c4b8e77f12325 +size 113308931 diff --git a/4b284b21bc4seed3/global_step80108/layer_13-model_01-model_states.pt b/4b284b21bc4seed3/global_step80108/layer_13-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5aa515076d9804f971324ec46e983a0266d6a9e2 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/layer_13-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4abb3f191f921f8ed7e973c4626a086b4d0d6cd045f44f323ee6d36735b913e7 +size 113308931 diff --git a/4b284b21bc4seed3/global_step80108/layer_14-model_00-model_states.pt b/4b284b21bc4seed3/global_step80108/layer_14-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2f782de010571f79a47dae9c9aa4ac411dcb99fa --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/layer_14-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a38e6fd415ca18f67af1d522cd62fced67d235a4e4cef66bcb6938371739d60b +size 113308931 diff --git a/4b284b21bc4seed3/global_step80108/layer_14-model_01-model_states.pt b/4b284b21bc4seed3/global_step80108/layer_14-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5d59b7d48b93233e3fb51cc38f8876ebfec5bf62 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/layer_14-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a13e5764602def55007f9dadf10123720607a069a78e941fd6f919e0b5d3ff77 +size 113308931 diff --git a/4b284b21bc4seed3/global_step80108/layer_15-model_00-model_states.pt b/4b284b21bc4seed3/global_step80108/layer_15-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..baa029a1bb2d4ead7a3df91e87189e8f83998a6b --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/layer_15-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd7ef2f4167cc6f085c9979e17142da5fa552ac1a8ee87f57c54d5c441fcb7ce +size 113308931 diff --git a/4b284b21bc4seed3/global_step80108/layer_15-model_01-model_states.pt b/4b284b21bc4seed3/global_step80108/layer_15-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..345a95804a25e133d0085f0ea86c1bb58006b98d --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/layer_15-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb9ad2a7e99852038ae8593ca1f09dcc8f5313a3ad031d75c9a9bb0dda6e460a +size 113308931 diff --git a/4b284b21bc4seed3/global_step80108/layer_16-model_00-model_states.pt b/4b284b21bc4seed3/global_step80108/layer_16-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d4003cfd32f6cc77c17b645b096ee61d9515baf7 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/layer_16-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6a5b408b8a43f41018bb668fc6811641ad376c3516d885b554a8c248cd538d7d +size 113308931 diff --git a/4b284b21bc4seed3/global_step80108/layer_16-model_01-model_states.pt b/4b284b21bc4seed3/global_step80108/layer_16-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a10d6acccf727a092ec72dd453c77ea70da4e6d0 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/layer_16-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:60df622e138346492f29c016e2c741f4c9aae1c8accf2ba87563c8a1069b7a1e +size 113308931 diff --git a/4b284b21bc4seed3/global_step80108/layer_17-model_00-model_states.pt b/4b284b21bc4seed3/global_step80108/layer_17-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c46d35e892fd099b9090501d2028cfb613631f0e --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/layer_17-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:11b6ac843c88c363824ed0862f7e23ae77fcedcb282c2a6ecf25419783782b26 +size 113308931 diff --git a/4b284b21bc4seed3/global_step80108/layer_17-model_01-model_states.pt b/4b284b21bc4seed3/global_step80108/layer_17-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..78d484d901c9f69f29534e324e809c782ac62511 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/layer_17-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f9958a80140ebc369bf094652ead88306154423da36f55488c92936885591b9 +size 113308931 diff --git a/4b284b21bc4seed3/global_step80108/layer_18-model_00-model_states.pt b/4b284b21bc4seed3/global_step80108/layer_18-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ee0715a2524aa5bacabb473d4c61c02202e372d1 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/layer_18-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a448814609b0e78d799cdfe52e5c7968319c5a8a30dd021b567213184e75d465 +size 113308931 diff --git a/4b284b21bc4seed3/global_step80108/layer_18-model_01-model_states.pt b/4b284b21bc4seed3/global_step80108/layer_18-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a0f316cc68014657a61859fb76ce810728b05972 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/layer_18-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ade39012c7fd2db045ba2129b122a15d04a38fcb49517826d79599f240d0688 +size 113308931 diff --git a/4b284b21bc4seed3/global_step80108/layer_19-model_00-model_states.pt b/4b284b21bc4seed3/global_step80108/layer_19-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d2e756c95c01e59f8ca6b4f5b0b87c1f5d8801c6 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/layer_19-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e91fadbcf1570fa0009397f678ec6b6487cba4830724bed7469b7a440243be7 +size 113308931 diff --git a/4b284b21bc4seed3/global_step80108/layer_19-model_01-model_states.pt b/4b284b21bc4seed3/global_step80108/layer_19-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..efe6498653bdd643bb4db6ab5fc4d74e66ec8813 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/layer_19-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d68ca13defcd95a1cd08665a051be214a3efd9758377046b6090db410493ae9 +size 113308931 diff --git a/4b284b21bc4seed3/global_step80108/layer_20-model_00-model_states.pt b/4b284b21bc4seed3/global_step80108/layer_20-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ad760f5f3ce9c4587de96583b4fe83044a542c6d --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/layer_20-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd73da617cc1abb88ac5812f83d16cbf3dd7fbf575eea279195474bf61ae1192 +size 113308931 diff --git a/4b284b21bc4seed3/global_step80108/layer_20-model_01-model_states.pt b/4b284b21bc4seed3/global_step80108/layer_20-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7696f98b42ef888989740b631abde0acae96849e --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/layer_20-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec7e95ec6679a5935775bbbd15973c4674b4b5a98b2cf9097f9dc366072c6b3e +size 113308931 diff --git a/4b284b21bc4seed3/global_step80108/layer_21-model_00-model_states.pt b/4b284b21bc4seed3/global_step80108/layer_21-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ba30f5f598bb05a1c1b8de0a5f1eb3cd8369b0d5 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/layer_21-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d6686f2d06bfb8717e1b2842ea05a734f9dbd95f728197eb9d25f47bd23236b +size 113308931 diff --git a/4b284b21bc4seed3/global_step80108/layer_21-model_01-model_states.pt b/4b284b21bc4seed3/global_step80108/layer_21-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d6aa6ccd954b43374dff172e7af21df6308d06b8 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/layer_21-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a746141630e5d8b3bcb8b8e364af3873c3af74466bc5b7c30388db61c8052459 +size 113308931 diff --git a/4b284b21bc4seed3/global_step80108/layer_22-model_00-model_states.pt b/4b284b21bc4seed3/global_step80108/layer_22-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..73204dbaf5814c2486f2dbcd87d068c633e878ba --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/layer_22-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:513e25035c00e0ce0e0964116d93f0db338712fb0ed5ce82e34e86c904eeced7 +size 113308931 diff --git a/4b284b21bc4seed3/global_step80108/layer_22-model_01-model_states.pt b/4b284b21bc4seed3/global_step80108/layer_22-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c18a579c64f2ffab82ca9ee14c973c4a8ba2d451 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/layer_22-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c775678ad65e1410fc2ab4790d8b78eda92f179c37dbeeb259342771c726827 +size 113308931 diff --git a/4b284b21bc4seed3/global_step80108/layer_23-model_00-model_states.pt b/4b284b21bc4seed3/global_step80108/layer_23-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..13a3bbfd58bad0914836331855d71719949a7061 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/layer_23-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64886b8f5e0c320e2e543c9bfd118a4ff730ef5870ea3afa652f8c1cfcab5f39 +size 113308931 diff --git a/4b284b21bc4seed3/global_step80108/layer_23-model_01-model_states.pt b/4b284b21bc4seed3/global_step80108/layer_23-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..68fb03fe94d5d0ebc1b5608f0885b888d1463d11 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/layer_23-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:224d66c17e93cd23688b3a1d874f89c87a6a2ddf3a87e009fdfd90b2f40e1542 +size 113308931 diff --git a/4b284b21bc4seed3/global_step80108/layer_24-model_00-model_states.pt b/4b284b21bc4seed3/global_step80108/layer_24-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d05cd809689079c83d787fbfd079f059c57c3bb4 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/layer_24-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:25f31aaf0893a73e8ae2edfe6e0ead0065ac64774f5107b0a283b717722e67a0 +size 113308931 diff --git a/4b284b21bc4seed3/global_step80108/layer_24-model_01-model_states.pt b/4b284b21bc4seed3/global_step80108/layer_24-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4ae8b75dee9c19bf808c009243520d5233a4e2be --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/layer_24-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac8db9bd3d19ffb4ccb520236e37d017787bfb0202cd696380d26dee7c6fff3e +size 113308931 diff --git a/4b284b21bc4seed3/global_step80108/layer_25-model_00-model_states.pt b/4b284b21bc4seed3/global_step80108/layer_25-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2940deb02ac449ff06d1c87557a1c1d32fcb308c --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/layer_25-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6636be800832caa1556fe2888ced71c3f1bdc540a281bb5f13676f31b34e587e +size 113308931 diff --git a/4b284b21bc4seed3/global_step80108/layer_25-model_01-model_states.pt b/4b284b21bc4seed3/global_step80108/layer_25-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9556b11983f85e39266256aabe17e3ab4764e246 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/layer_25-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef1e3784692aa6958e9cf84bb24a7dd6f046961d8dcd6bd797bf7f0d8f4025e6 +size 113308931 diff --git a/4b284b21bc4seed3/global_step80108/layer_26-model_00-model_states.pt b/4b284b21bc4seed3/global_step80108/layer_26-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..77cce5acad6b9779eb6192a71f527f541204d014 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/layer_26-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c44e6696fb40e4974363e0ec49315e0bbc61478bcec01c613e7d7c5e7cfd0ab7 +size 113308931 diff --git a/4b284b21bc4seed3/global_step80108/layer_26-model_01-model_states.pt b/4b284b21bc4seed3/global_step80108/layer_26-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..889851dad55bdb3506edeece115189265ab30ae7 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/layer_26-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:573055cdbd60585a6ea0ca8b39d20cadcc2563a303b005c1a95f0c9edb6fed8b +size 113308931 diff --git a/4b284b21bc4seed3/global_step80108/layer_27-model_00-model_states.pt b/4b284b21bc4seed3/global_step80108/layer_27-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3f39e072cc57f43e7148ac52fa631a297d452c5d --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/layer_27-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d6b0e3dd09e0cb2b5b605c2788501a70cc10dadac3a3b90236ce35a73dd3f078 +size 113308931 diff --git a/4b284b21bc4seed3/global_step80108/layer_27-model_01-model_states.pt b/4b284b21bc4seed3/global_step80108/layer_27-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..947c6d30d74cb8682a8d60111ce502b93ae037f2 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/layer_27-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:921b3bb0dd761445142f352cc271954deb839a9a3688dc00e61a0e1c4b01dad0 +size 113308931 diff --git a/4b284b21bc4seed3/global_step80108/layer_28-model_00-model_states.pt b/4b284b21bc4seed3/global_step80108/layer_28-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..499d48846049d3e88285c25eb90988de6227f3f8 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/layer_28-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:739066a02ada4d5cc5c287f5395094a06363eb47f104e46b45c6235cffac2dec +size 113308931 diff --git a/4b284b21bc4seed3/global_step80108/layer_28-model_01-model_states.pt b/4b284b21bc4seed3/global_step80108/layer_28-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5947bf90ca37e2cdf433743b94a108f6650c6d84 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/layer_28-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:538b75822ee65444ab5109abb374abcfce30edae12f74c2bc9b9ead1232a04c4 +size 113308931 diff --git a/4b284b21bc4seed3/global_step80108/layer_29-model_00-model_states.pt b/4b284b21bc4seed3/global_step80108/layer_29-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..46bc6a5b579ad7e11f432f55c5c608e7358b3972 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/layer_29-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:49091cbf5cab4dc53f03fce3beec4795b4ee242a0de9ff2a088b867d39368b99 +size 113308931 diff --git a/4b284b21bc4seed3/global_step80108/layer_29-model_01-model_states.pt b/4b284b21bc4seed3/global_step80108/layer_29-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3ede1a782957f2a4e18aaaeb87de40e2080d6458 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/layer_29-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:824fa55b28310988850f6f60869e7416315889044630a871442ca2fd2dc3032c +size 113308931 diff --git a/4b284b21bc4seed3/global_step80108/layer_30-model_00-model_states.pt b/4b284b21bc4seed3/global_step80108/layer_30-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2c62794fb23b4810c4992ab08946c93722db69bc --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/layer_30-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:407a22c591c0b3bad4c7e5b64b52bc691c168cc4080d9a45aef9c2ee15efecb4 +size 113308931 diff --git a/4b284b21bc4seed3/global_step80108/layer_30-model_01-model_states.pt b/4b284b21bc4seed3/global_step80108/layer_30-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..412539a77a83feb0422748a57879c7a9f518defb --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/layer_30-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c5a0c98a4330f9ee0927ec892887857f46c8b2b75ae6fb5a756368a9124043d +size 113308931 diff --git a/4b284b21bc4seed3/global_step80108/layer_31-model_00-model_states.pt b/4b284b21bc4seed3/global_step80108/layer_31-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8d4ff8987b3390e43ff872a5f74ab943bfdd7380 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/layer_31-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7dd55963b5860bfde8d723ff1c1e1d5db7895478fdcf32ef50f7c916fc6f01a0 +size 113308931 diff --git a/4b284b21bc4seed3/global_step80108/layer_31-model_01-model_states.pt b/4b284b21bc4seed3/global_step80108/layer_31-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0e770544244597a47b86f53fe7b9d35b808449b8 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/layer_31-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:60d21c7f2bd1f3fe8fde2eb9784f1ef7b77106b02a71ab7e737a0034ca8b02f2 +size 113308931 diff --git a/4b284b21bc4seed3/global_step80108/layer_32-model_00-model_states.pt b/4b284b21bc4seed3/global_step80108/layer_32-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4b7e4db9ac16af8d4c647479cbf0d1f08cdc0b6e --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/layer_32-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e4c29843a7a57fe7bdf3d1ca31f07d744150cfc624eb5bac978ab834abf3ef6 +size 113308931 diff --git a/4b284b21bc4seed3/global_step80108/layer_32-model_01-model_states.pt b/4b284b21bc4seed3/global_step80108/layer_32-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3ab1c31a016e6a215586cd3f9d757c0fc6734c38 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/layer_32-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a3ae7f026abab488a80f52cf37f4e7038565ebd0791e8da3d0f0f222287163ea +size 113308931 diff --git a/4b284b21bc4seed3/global_step80108/layer_33-model_00-model_states.pt b/4b284b21bc4seed3/global_step80108/layer_33-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..032a49b14d3bfcc2b1b372c63ab07fe8eabfadd7 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/layer_33-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:17c505e90ba82c076bb376b032189a001c314b2003ab19ee6c9b281b8e68d597 +size 113308931 diff --git a/4b284b21bc4seed3/global_step80108/layer_33-model_01-model_states.pt b/4b284b21bc4seed3/global_step80108/layer_33-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4531f0a21a3ccd2e317a6180b70c787cecba3650 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/layer_33-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db0ca40a51568bb540d5ab2166eb077c3d17779c27f119d914ed2df00b18121c +size 113308931 diff --git a/4b284b21bc4seed3/global_step80108/layer_34-model_00-model_states.pt b/4b284b21bc4seed3/global_step80108/layer_34-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..482358a29c0a90bfdb012d5c3cef90e4eb9ad8a4 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/layer_34-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a7ed7608bbb6577e2e1e9eae23aaf863b36f4dd2d201e559cf1530f5efb88ba +size 113308931 diff --git a/4b284b21bc4seed3/global_step80108/layer_34-model_01-model_states.pt b/4b284b21bc4seed3/global_step80108/layer_34-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9782b3a9f1b678a6f174819211a70edb2d1eb616 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/layer_34-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f69254fcf2363cbc11d788989cf4f0b2ff45e4ae6ab8ef96393027d68ebfa6f +size 113308931 diff --git a/4b284b21bc4seed3/global_step80108/layer_35-model_00-model_states.pt b/4b284b21bc4seed3/global_step80108/layer_35-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a6108dfc349f0826cb4a938672d42c38560be1e3 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/layer_35-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:beb3938314c41c6e77a14b6c4df66330ac064cc1e91f4b3fc717baff58c156d1 +size 113308931 diff --git a/4b284b21bc4seed3/global_step80108/layer_35-model_01-model_states.pt b/4b284b21bc4seed3/global_step80108/layer_35-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..89498aacbdc65a28a4ea985f5de6266831c6ac41 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/layer_35-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ca34903d2919c4817356bcab51fefaa8b110c3c2aa75847befbfabd4ca06e46 +size 113308931 diff --git a/4b284b21bc4seed3/global_step80108/layer_36-model_00-model_states.pt b/4b284b21bc4seed3/global_step80108/layer_36-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..716337aa845a32cba106cf08481ded09ef98d682 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/layer_36-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dfa699ec06eefb5d9ba8bdcf4b3e73484f8624e24b49f4ee7c99daad78edebcd +size 113308931 diff --git a/4b284b21bc4seed3/global_step80108/layer_36-model_01-model_states.pt b/4b284b21bc4seed3/global_step80108/layer_36-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c8e0e56aa8866b9a523f741e73de81f3fdac1406 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/layer_36-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b3363a2902dff5a0018a42e4103836d8897a672296babfebd15b1f622a095d6d +size 113308931 diff --git a/4b284b21bc4seed3/global_step80108/layer_37-model_00-model_states.pt b/4b284b21bc4seed3/global_step80108/layer_37-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a760d3f94acf7f75afbe529900bb0c6376ad111d --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/layer_37-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9c0e1e7ec000b8171c67704af323c59d7285feabac4b84982454fc3ed1b501f +size 113308931 diff --git a/4b284b21bc4seed3/global_step80108/layer_37-model_01-model_states.pt b/4b284b21bc4seed3/global_step80108/layer_37-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..98b2e7dce1a32022a141c8b141f453183de55436 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/layer_37-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:727b21a26695ca1bf1ccf01bb25dc041796f2207e8acb02f28c70909a0e7c849 +size 113308931 diff --git a/4b284b21bc4seed3/global_step80108/layer_38-model_00-model_states.pt b/4b284b21bc4seed3/global_step80108/layer_38-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8dff61ce377c68ddbbfbe288cfbec5476a5dae0a --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/layer_38-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3717d4309b0dc1ef7b3dee1c723d1e83e632de5ee4ab011ecd6de445e87c67df +size 113308931 diff --git a/4b284b21bc4seed3/global_step80108/layer_38-model_01-model_states.pt b/4b284b21bc4seed3/global_step80108/layer_38-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..10e391cb8357e176fd5eab87e45c9c4778aa0516 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/layer_38-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7f5e3de9bd3beb19b20a866dd73c38df481a5af5950fb08e0f9af8f398c06c8 +size 113308931 diff --git a/4b284b21bc4seed3/global_step80108/layer_40-model_00-model_states.pt b/4b284b21bc4seed3/global_step80108/layer_40-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..88ff04d13fe86479afefcf35ad204c16f18a0925 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/layer_40-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a81a9b0d4c13ecb1438313c2253310429b6a5afffc2c847e12c3a2e19abe65cf +size 13507 diff --git a/4b284b21bc4seed3/global_step80108/layer_40-model_01-model_states.pt b/4b284b21bc4seed3/global_step80108/layer_40-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..de92e8479dfc37736df898231d6ff7399c10afc4 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/layer_40-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3dfbe6bef00ec0b89b7d51b646e43fbd4ee3fa61ddb20334167ea61705ae7ef +size 13507 diff --git a/4b284b21bc4seed3/global_step80108/mp_rank_00_model_states.pt b/4b284b21bc4seed3/global_step80108/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..620eabd15ed9aa3dc63df368809e17314e78d119 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f25a8462be7f279ddcb3ce4ae9ce3b2e1614f6594bb4df43e8c15b9082c6c1b +size 51507 diff --git a/4b284b21bc4seed3/global_step80108/mp_rank_01_model_states.pt b/4b284b21bc4seed3/global_step80108/mp_rank_01_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..782024160780482a0f6b3afb3ec11c55b17b9026 --- /dev/null +++ b/4b284b21bc4seed3/global_step80108/mp_rank_01_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:33c3ab3881fbe8539c130aafe97fd41d04f9d468ccdc5cddbcec6fafc3a9b142 +size 51507 diff --git a/4b284b21bc4seed3/transformers/config.json b/4b284b21bc4seed3/transformers/config.json new file mode 100644 index 0000000000000000000000000000000000000000..df814c3a71ee49044410636b5eeb4f43611690ba --- /dev/null +++ b/4b284b21bc4seed3/transformers/config.json @@ -0,0 +1 @@ +{"vocab_size": 50432, "n_positions": 2048, "n_embd": 3072, "n_layer": 36, "n_head": 24, "n_inner": 12288, "activation_function": "gelu", "resid_pdrop": 0.1, "embd_pdrop": 0.1, "attn_pdrop": 0.1, "layer_norm_epsilon": 1e-05, "initializer_range": 0.02, "summary_type": "cls_index", "summary_use_proj": true, "summary_activation": null, "summary_first_dropout": 0.1, "summary_proj_to_labels": true, "scale_attn_weights": true, "use_cache": true, "scale_attn_by_inverse_layer_idx": false, "reorder_and_upcast_attn": false, "bos_token_id": 50256, "eos_token_id": 50256, "return_dict": true, "output_hidden_states": false, "output_attentions": false, "torchscript": false, "torch_dtype": null, "use_bfloat16": false, "tf_legacy_loss": false, "pruned_heads": {}, "tie_word_embeddings": true, "is_encoder_decoder": false, "is_decoder": false, "cross_attention_hidden_size": null, "add_cross_attention": false, "tie_encoder_decoder": false, "max_length": 20, "min_length": 0, "do_sample": false, "early_stopping": false, "num_beams": 1, "num_beam_groups": 1, "diversity_penalty": 0.0, "temperature": 1.0, "top_k": 50, "top_p": 1.0, "typical_p": 1.0, "repetition_penalty": 1.0, "length_penalty": 1.0, "no_repeat_ngram_size": 0, "encoder_no_repeat_ngram_size": 0, "bad_words_ids": null, "num_return_sequences": 1, "chunk_size_feed_forward": 0, "output_scores": false, "return_dict_in_generate": false, "forced_bos_token_id": null, "forced_eos_token_id": null, "remove_invalid_values": false, "exponential_decay_length_penalty": null, "suppress_tokens": null, "begin_suppress_tokens": null, "architectures": ["GPT2LMHeadModel"], "finetuning_task": null, "id2label": {"0": "LABEL_0", "1": "LABEL_1"}, "label2id": {"LABEL_0": 0, "LABEL_1": 1}, "tokenizer_class": null, "prefix": null, "pad_token_id": null, "sep_token_id": null, "decoder_start_token_id": null, "task_specific_params": null, "problem_type": null, "_name_or_path": "", "transformers_version": "4.25.0.dev0", "n_ctx": 1024, "gradient_checkpointing": false, "model_type": "gpt2"} \ No newline at end of file diff --git a/4b284b21bc4seed3/transformers/pytorch_model.bin b/4b284b21bc4seed3/transformers/pytorch_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..7d48750e4b1f69e327f0b1d98e6a126160346393 --- /dev/null +++ b/4b284b21bc4seed3/transformers/pytorch_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b1f25408363543a27c6dc446ed6b123f79019eeb0cf53d31ad6bf4f9d2696c1 +size 8781203669 diff --git a/4b284b21bc4seed4/evaluation/generation/agg.4b284b21bc4seed4_GEM-web_nlg_en_PALM_prompt_0.json b/4b284b21bc4seed4/evaluation/generation/agg.4b284b21bc4seed4_GEM-web_nlg_en_PALM_prompt_0.json new file mode 100644 index 0000000000000000000000000000000000000000..f75afc940e4f23b8654b487f487f41f2190119f4 --- /dev/null +++ b/4b284b21bc4seed4/evaluation/generation/agg.4b284b21bc4seed4_GEM-web_nlg_en_PALM_prompt_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.3751221736027223, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.04603981713785397}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.07050754951097193, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0015950749741378038}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.2930621241248632, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0047039720667729585}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.10655282549139757, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002069892427617646}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.03327005966333133, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0009772300003902292}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.14224611225552608, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0031500776280318555}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.05052209059024575, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0012866888304456589}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.0677233404229661, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0014833039402630307}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.28507940697548506, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004611898165464154}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.10267935520945128, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0019389896303185993}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.06739541442277049, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0015164320427077738}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.27995528365978256, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004446276996131344}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.10179374812954574, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0019553887116743455}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b21bc4seed4/evaluation/generation/agg.4b284b21bc4seed4_GEM-web_nlg_en_PALM_prompt_1.json b/4b284b21bc4seed4/evaluation/generation/agg.4b284b21bc4seed4_GEM-web_nlg_en_PALM_prompt_1.json new file mode 100644 index 0000000000000000000000000000000000000000..efe728afc7049922276d3116d212e3e201d68f30 --- /dev/null +++ b/4b284b21bc4seed4/evaluation/generation/agg.4b284b21bc4seed4_GEM-web_nlg_en_PALM_prompt_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.5198830574890386, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.03504017360483535}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.07738811110777072, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0015304988936609128}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.3862577997016925, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.00572058610283539}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.12070700921084229, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002002150459250641}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.03507152315512706, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0008467381062339321}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.18709836433905874, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.003833792467120382}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.05531307099139748, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0012137549494064656}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.07158564602943736, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0013356095688320767}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.3620899416623159, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.005273165348503305}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.11194710382233043, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0017263614451165634}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.07309280304036243, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0014294724139865343}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.36442715703356776, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.005241997303110117}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.11393170029640054, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0018446583441229345}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b21bc4seed4/evaluation/generation/agg.4b284b21bc4seed4_GEM-web_nlg_en_PALM_prompt_2.json b/4b284b21bc4seed4/evaluation/generation/agg.4b284b21bc4seed4_GEM-web_nlg_en_PALM_prompt_2.json new file mode 100644 index 0000000000000000000000000000000000000000..8c72092c0111fa19ce15286d3c5dde0ec961f67e --- /dev/null +++ b/4b284b21bc4seed4/evaluation/generation/agg.4b284b21bc4seed4_GEM-web_nlg_en_PALM_prompt_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.5772980788839762, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.0351401276773091}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.07813906472896695, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0013627013823755202}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.4101295780853266, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.005693087311032938}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.12373316030300299, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0018974475884765722}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.03581354421318794, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0008022617515173707}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.2032111746093155, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.003954708803559}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.0570319859750151, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0011521977790571885}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.07158825167996366, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0011655724191791303}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.3794140508633469, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.005145968326494213}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.11350896035348979, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0016169887067107285}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.07387016720939305, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0012627844516927061}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.38737624946784815, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.005248864126942714}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.11690863992503238, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0017500511668341343}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b21bc4seed4/evaluation/generation/agg.4b284b21bc4seed4_GEM-web_nlg_en_PALM_prompt_3.json b/4b284b21bc4seed4/evaluation/generation/agg.4b284b21bc4seed4_GEM-web_nlg_en_PALM_prompt_3.json new file mode 100644 index 0000000000000000000000000000000000000000..9df9d6d45b2ef651381605d33ae582d68fbccf75 --- /dev/null +++ b/4b284b21bc4seed4/evaluation/generation/agg.4b284b21bc4seed4_GEM-web_nlg_en_PALM_prompt_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.6456226857113138, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.040165536189754096}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.0778881396479436, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0012769567386518232}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.42296024366383517, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.00569044382493207}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.12436437584313036, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.001814950124577219}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.03521828535740504, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0007298691703855176}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.20809711310932535, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.003931907827643346}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.05661337603042263, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.001071749411178637}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.07076272874827239, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0011113411679509696}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.3866270125315969, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.005107912406441445}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.11292204203780767, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0015573442585516018}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.0732788083787352, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0011890321940136864}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.39617638119143006, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0051662731631678}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.1168466330708585, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0016763512625120776}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b21bc4seed4/evaluation/generation/agg.4b284b21bc4seed4_GEM-web_nlg_en_PALM_prompt_4.json b/4b284b21bc4seed4/evaluation/generation/agg.4b284b21bc4seed4_GEM-web_nlg_en_PALM_prompt_4.json new file mode 100644 index 0000000000000000000000000000000000000000..047bcd8747021143c9c4d7860a22a3c33b917d95 --- /dev/null +++ b/4b284b21bc4seed4/evaluation/generation/agg.4b284b21bc4seed4_GEM-web_nlg_en_PALM_prompt_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.7394949248334012, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.0375339718418186}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.07935954064608862, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0012440228309059662}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.44189075126537175, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0056160164221400995}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.12719292338738244, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0017548996669778086}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.03609299322498633, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0007391134009433947}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.21980568290237434, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.004020542118197972}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.058223377247645175, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.001073250860654579}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.07145742950585998, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0010699196551391536}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.3991369324047731, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0049417529681389525}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.1144359922322097, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0014869489906081234}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.07454021703025861, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0011655709781687874}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.41368909933661674, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.005127640598028314}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.11931787390462796, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0016294893480413802}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b21bc4seed4/evaluation/generation/agg.4b284b21bc4seed4_GEM-web_nlg_en_PALM_prompt_5.json b/4b284b21bc4seed4/evaluation/generation/agg.4b284b21bc4seed4_GEM-web_nlg_en_PALM_prompt_5.json new file mode 100644 index 0000000000000000000000000000000000000000..450cd7dc9c1de6a87be8062330933a45e543ea1f --- /dev/null +++ b/4b284b21bc4seed4/evaluation/generation/agg.4b284b21bc4seed4_GEM-web_nlg_en_PALM_prompt_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.7350884275632563, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.04285525370548216}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.07963440574460627, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0012450999827039412}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.450750421306443, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.005688854042032203}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.12790081410584203, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.001762758952960184}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.03626337631746513, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0007247188269312321}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.22702405178339297, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.004195235523736308}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.058684632135392434, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0010628257100155462}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.07125643393688096, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.00105707615542693}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.4063747251874938, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.005069676186964856}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.11440641190075858, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0014753694031490337}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.07452930873504321, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0011537233047546483}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.42116829387113064, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.005204895411040752}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.11957698534047122, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0016217012306438583}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b21bc4seed4/evaluation/generation/agg.4b284b21bc4seed4_GEM-wiki_lingua_en_tldr_en_0.json b/4b284b21bc4seed4/evaluation/generation/agg.4b284b21bc4seed4_GEM-wiki_lingua_en_tldr_en_0.json new file mode 100644 index 0000000000000000000000000000000000000000..30541ceed5195b7b03eafde9fae9492b0a07c54e --- /dev/null +++ b/4b284b21bc4seed4/evaluation/generation/agg.4b284b21bc4seed4_GEM-wiki_lingua_en_tldr_en_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.15229529499726693, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0018532935787449235}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.2584223718261279, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0025516613510239644}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.17846806393672296, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0018156572490314613}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.030189999709011046, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0007527178027814116}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.05276107785013939, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0013537005512275853}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.035498190179559366, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0008425007414760624}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.11790693896267036, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.001294367886229787}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.20826559324975696, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0020968023223764095}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.13992548854671796, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0012925170885687428}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.1388827214194179, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0016844636725997805}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.2370411466342553, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002357902527598024}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.16300806309885615, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0016517242441511555}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 1.5445764212442845, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.046348567423538295}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b21bc4seed4/evaluation/generation/agg.4b284b21bc4seed4_GEM-wiki_lingua_en_tldr_en_1.json b/4b284b21bc4seed4/evaluation/generation/agg.4b284b21bc4seed4_GEM-wiki_lingua_en_tldr_en_1.json new file mode 100644 index 0000000000000000000000000000000000000000..8c301ef9e7aec061b03909b84aaabe339cf90e03 --- /dev/null +++ b/4b284b21bc4seed4/evaluation/generation/agg.4b284b21bc4seed4_GEM-wiki_lingua_en_tldr_en_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.19660419529835046, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0021703512663018435}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.33305075642202464, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0027422057559937344}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.22871763440008758, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0019504250194142293}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.048646612266404474, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0010079743018688542}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.08571356139913104, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0017928353996558705}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.056810181676750955, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0010692773805419653}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.13473919020916866, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0014138439503997033}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.2377264850157444, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0022081866868395457}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.1584532961497466, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0012813295440813953}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.18408931555378133, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0020314434795525877}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.3130915982176866, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002608677189171684}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.21440206759227748, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0018298647451743082}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 2.9354736259244234, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.08184998217131226}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b21bc4seed4/evaluation/generation/agg.4b284b21bc4seed4_GEM-wiki_lingua_en_tldr_en_2.json b/4b284b21bc4seed4/evaluation/generation/agg.4b284b21bc4seed4_GEM-wiki_lingua_en_tldr_en_2.json new file mode 100644 index 0000000000000000000000000000000000000000..73cc74ea431d7ad6bb4357a34d5d1fd1aa4e9c08 --- /dev/null +++ b/4b284b21bc4seed4/evaluation/generation/agg.4b284b21bc4seed4_GEM-wiki_lingua_en_tldr_en_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.19308251629949974, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0021372296672672315}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.3226572993341573, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002715283947112145}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.2216752304780583, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0018496410521841634}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.04755808223353882, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.001056965112675896}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.08157607236301773, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0016928843275132437}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.05419402589748163, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0010092487989924672}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.13475955724902108, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0015213837884005157}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.23151769344902068, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002143281502769755}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.15534336307223465, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0012446244313757237}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.18213738467572518, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0020147435204007475}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.3053278835262653, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0025811768541287375}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.2092469074780288, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0017297088792391818}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 2.988336179481119, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.07284534182808335}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b21bc4seed4/evaluation/generation/agg.4b284b21bc4seed4_GEM-wiki_lingua_en_tldr_en_3.json b/4b284b21bc4seed4/evaluation/generation/agg.4b284b21bc4seed4_GEM-wiki_lingua_en_tldr_en_3.json new file mode 100644 index 0000000000000000000000000000000000000000..db8d791bc884feb1485772acc3cb91122123caf5 --- /dev/null +++ b/4b284b21bc4seed4/evaluation/generation/agg.4b284b21bc4seed4_GEM-wiki_lingua_en_tldr_en_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.16818607657817242, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.002571340600589284}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.2618591281994728, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0033215062620397654}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.18235828185303843, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0022330522398271444}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.039906055320126824, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0011176532929901056}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.06504905939729995, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0016338067696316037}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.04352751746326409, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.000986420480404656}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.11910589220232795, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.001919539273889145}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.18906464586111238, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002550157025960148}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.12850084937451378, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0015346657748469231}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.1592819269786109, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0024458047067507224}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.24869687852492026, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.00317986279337076}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.17275184259901263, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0021141809407287217}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 2.955313094852994, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.0766356215689601}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b21bc4seed4/evaluation/generation/agg.4b284b21bc4seed4_GEM-wiki_lingua_en_tldr_en_4.json b/4b284b21bc4seed4/evaluation/generation/agg.4b284b21bc4seed4_GEM-wiki_lingua_en_tldr_en_4.json new file mode 100644 index 0000000000000000000000000000000000000000..1c821901effbe62b35eba79a2079c7bd13f9a24d --- /dev/null +++ b/4b284b21bc4seed4/evaluation/generation/agg.4b284b21bc4seed4_GEM-wiki_lingua_en_tldr_en_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.05651284854563454, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.002164889280586853}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.08771427792659671, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.003046668032178251}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.0587450878634487, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.001987849748246455}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.01373423070578025, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0007944242550989159}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.023902876010557156, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0012871698398313374}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.014698951085450463, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0007071025730658953}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.041455127649633716, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.001604158922614608}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.06565381938564946, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002338953948684061}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.04283521055248602, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.001420656788711465}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.053065857077570854, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0020380922902812288}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.08260798722441874, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002886226452230474}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.05516099966060376, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0018676755144161564}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 0.6681174311441812, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.044021606714169687}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b21bc4seed4/evaluation/generation/agg.4b284b21bc4seed4_GEM-wiki_lingua_en_tldr_en_5.json b/4b284b21bc4seed4/evaluation/generation/agg.4b284b21bc4seed4_GEM-wiki_lingua_en_tldr_en_5.json new file mode 100644 index 0000000000000000000000000000000000000000..b9defe276f3f8972ff8c277eb72e3173ef921660 --- /dev/null +++ b/4b284b21bc4seed4/evaluation/generation/agg.4b284b21bc4seed4_GEM-wiki_lingua_en_tldr_en_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.008744552174562775, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0008820534430831269}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.014063870074080958, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0013626675606431993}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.009157992753346606, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.000856510665924713}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.001867598511771763, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0002589055645534681}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.0037526556188222397, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0005665830894881638}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.002073109168721178, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.00025579423912383813}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.006278467313776165, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0006318463479225579}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.010544788230721835, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0010639298188298192}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.006597140236099842, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0006134117940431641}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.00823467650006455, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.000829000231276819}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.013318449806788014, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0012936214066513207}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.008602211224573027, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0007971656716790751}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 8.138411373037316e-07, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 1.7429365149014433e-06}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b21bc4seed4/evaluation/generation/agg.4b284b21bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_0.json b/4b284b21bc4seed4/evaluation/generation/agg.4b284b21bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_0.json new file mode 100644 index 0000000000000000000000000000000000000000..3275828e2c98d36d327f8796c82db958b8cd4607 --- /dev/null +++ b/4b284b21bc4seed4/evaluation/generation/agg.4b284b21bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 0.1675172437507659, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.027600643399440884}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.028701737940994714, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0010195754285503126}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.02982766113489123, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0008471594561940423}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.024088126860004336, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0006566077823850723}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.0015626210476206773, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0003728911300811695}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.0014347430615192808, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.00023769294132393532}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.001114996015022125, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.00018328608469909375}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.028417386089142856, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0009947648295870358}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.029685273969587405, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.00083480831932383}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.023944632138488853, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0006463198681447033}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.02728685295948081, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0009885875546693994}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.02727004908623676, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0007114664570306672}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.022309991073370505, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0005760998972707722}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b21bc4seed4/evaluation/generation/agg.4b284b21bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_1.json b/4b284b21bc4seed4/evaluation/generation/agg.4b284b21bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_1.json new file mode 100644 index 0000000000000000000000000000000000000000..11b4d4858ab98e3e6a0ab2974f53861f93c633c2 --- /dev/null +++ b/4b284b21bc4seed4/evaluation/generation/agg.4b284b21bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 5.8311861735166675, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.06388138684732117}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.2601081962246765, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0021349255671127927}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.4686781469942304, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002825480648369596}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.3211813837867464, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002018437643374035}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.10907314684339463, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0013682678699487114}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.1992897827723483, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0021146365213576476}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.13429472916574672, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0014217210935365725}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.2056686183422757, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0015071237696962308}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.37982651296992087, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0023920704305803887}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.25612256110358006, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0014268806319662325}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.2117404050410904, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0019554275881996357}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.379262023761823, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0026640542361163967}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.2605843619987691, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0019094298729220246}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b21bc4seed4/evaluation/generation/agg.4b284b21bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_2.json b/4b284b21bc4seed4/evaluation/generation/agg.4b284b21bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_2.json new file mode 100644 index 0000000000000000000000000000000000000000..33bc0877539e626ce5ea4c85827aa97019c13ae3 --- /dev/null +++ b/4b284b21bc4seed4/evaluation/generation/agg.4b284b21bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 8.283032143741265, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.12324083863995262}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.3538185229938564, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0026093673205933284}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.47654923761453416, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002742670643307486}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.386855872645816, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0021481774383948936}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.16058763409752866, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0017929892307175898}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.2186758841759895, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0021644223522511653}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.17540917102638537, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.001676199795834029}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.2634180709043917, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0019363360461210728}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.3633286847976612, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002418760103075258}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.29032162387497273, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0016448424366105137}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.2943420649549215, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0024049285177976626}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.396021431067016, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0026539511959613863}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.3215658810211159, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0020865232232060243}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b21bc4seed4/evaluation/generation/agg.4b284b21bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_3.json b/4b284b21bc4seed4/evaluation/generation/agg.4b284b21bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_3.json new file mode 100644 index 0000000000000000000000000000000000000000..61e34a954842e47b4a5691a17b7588856b8d0af0 --- /dev/null +++ b/4b284b21bc4seed4/evaluation/generation/agg.4b284b21bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 10.390741038004455, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.16864807456665598}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.4170328570049967, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.002406804998864227}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.4755330496164165, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0027356944570645627}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.4265219434574998, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.00200022371619217}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.19311277752964032, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0018435166685741753}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.2234558315509727, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.00217671447753381}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.19794956049387477, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0017257612820525093}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.3018404766668879, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0019954675660840008}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.34733784496925735, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002410859115489849}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.30937209897451035, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0017399874604572011}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.34804273669533864, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.002320309559338597}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.39674483976023345, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002636069670789193}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.35577353404582346, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002018349673780584}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b21bc4seed4/evaluation/generation/agg.4b284b21bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_4.json b/4b284b21bc4seed4/evaluation/generation/agg.4b284b21bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_4.json new file mode 100644 index 0000000000000000000000000000000000000000..cb586148dc917c901fc4e8f43ea8996b3a467bcf --- /dev/null +++ b/4b284b21bc4seed4/evaluation/generation/agg.4b284b21bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 11.329341641449828, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.17960715134758612}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.43540537755676456, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0023276114946809037}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.4809839727831288, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0026909272047918853}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.4404396724578438, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0019501997658908016}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.20335070986022913, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0018630249723704795}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.2277953855378017, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002231447665036813}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.20632107444632167, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0017999776378623833}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.31052804922692206, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0019906703253583058}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.34538706806048836, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0024265779869813795}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.3146665867607543, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.001793539263470212}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.36360422785078816, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.002278768446357271}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.40267975309659465, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002691014459855529}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.3681598682721843, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0020492701030304073}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b21bc4seed4/evaluation/generation/agg.4b284b21bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_5.json b/4b284b21bc4seed4/evaluation/generation/agg.4b284b21bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_5.json new file mode 100644 index 0000000000000000000000000000000000000000..7ff2f383bb0716a81c2eff049d292ebcd93f6b30 --- /dev/null +++ b/4b284b21bc4seed4/evaluation/generation/agg.4b284b21bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 11.285255750718802, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.18888005349774178}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.4365680288096621, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0023563761935207865}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.48375423799463574, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002636920734911192}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.4415151553259178, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0018967405556148942}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.2041613364300487, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0018478653045982886}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.2286562929012743, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0021444262626903934}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.20666903463506434, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0017287346978560685}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.3097317177052037, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0019875430217516188}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.3463247383671021, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0024086631359451073}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.31404489497308175, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0017489740232863793}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.36511129451802127, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.002275854131726726}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.40524349161687195, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002592210635732001}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.3693839714597318, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.001956221447002133}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b21bc4seed4/evaluation/generation/agg.4b284b21bc4seed4_gem_xsum_article_DOC_summary_0.json b/4b284b21bc4seed4/evaluation/generation/agg.4b284b21bc4seed4_gem_xsum_article_DOC_summary_0.json new file mode 100644 index 0000000000000000000000000000000000000000..da6619e13c2b095fa2ae7ee29b3278fb4c4a842d --- /dev/null +++ b/4b284b21bc4seed4/evaluation/generation/agg.4b284b21bc4seed4_gem_xsum_article_DOC_summary_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.16661991011320432, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0024239320503688508}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.3334279529769119, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004505784466073162}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.21238019045835924, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0026416842263647295}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.036458947908946444, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0013971876206545527}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.07797973705513334, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0027575216878305796}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.0474651150579007, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0016508808672473486}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.12350643841301835, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0018449748802517576}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.24834266376447475, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0034694940835095387}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.1574172507962458, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0019726023490667156}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.12930576998616114, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.001943629127681205}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.2628771358874318, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.003928661472441744}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.16564203891769072, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0021922015182424493}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 1.9920111933130942, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.09083971543338792}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b21bc4seed4/evaluation/generation/agg.4b284b21bc4seed4_gem_xsum_article_DOC_summary_1.json b/4b284b21bc4seed4/evaluation/generation/agg.4b284b21bc4seed4_gem_xsum_article_DOC_summary_1.json new file mode 100644 index 0000000000000000000000000000000000000000..e3aee59017cf66cc0b261339068a4d5789dc3b58 --- /dev/null +++ b/4b284b21bc4seed4/evaluation/generation/agg.4b284b21bc4seed4_gem_xsum_article_DOC_summary_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.12220764132281824, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0017962553489656822}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.3046016264780442, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004195472170007382}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.17238543114114188, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0024273582171495467}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.02404240814314951, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0009715966898615973}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.06279570551371068, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0026393784630938297}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.03433659588366439, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0013916698462749025}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.0948627092015581, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0013564109394382858}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.23873232992980792, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0033732063257411065}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.13411490255282393, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.001857806891825946}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.09744320598123982, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0014533168661689533}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.24526431304855986, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0036135020193240157}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.1377971067717085, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0019961553438677753}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 1.3911048134042985, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.10897719788542379}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b21bc4seed4/evaluation/generation/agg.4b284b21bc4seed4_gem_xsum_article_DOC_summary_2.json b/4b284b21bc4seed4/evaluation/generation/agg.4b284b21bc4seed4_gem_xsum_article_DOC_summary_2.json new file mode 100644 index 0000000000000000000000000000000000000000..44f3bca63cc4a18b0a0932062585cf8f9a2d4901 --- /dev/null +++ b/4b284b21bc4seed4/evaluation/generation/agg.4b284b21bc4seed4_gem_xsum_article_DOC_summary_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.12742301658282565, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0018019437038001125}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.31650559447584714, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0041632693268193}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.1796260802555828, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0024295120173709354}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.026873267786760833, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0010274689542246274}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.06937748072287012, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002720274634345644}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.03828129617404584, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0014588717099132717}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.09972086437810422, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0013615528035081867}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.25006918430896163, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0033224978911440477}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.14088593992593365, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0018545171064126879}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.10228150708865971, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.001498292749384224}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.2564975734365291, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.003645659171226953}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.14453096950758154, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0020492721061134787}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 1.5131027243134945, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.09818604218520245}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b21bc4seed4/evaluation/generation/agg.4b284b21bc4seed4_gem_xsum_article_DOC_summary_3.json b/4b284b21bc4seed4/evaluation/generation/agg.4b284b21bc4seed4_gem_xsum_article_DOC_summary_3.json new file mode 100644 index 0000000000000000000000000000000000000000..502f9f0dd82103b0304d28a45d375d4f00055839 --- /dev/null +++ b/4b284b21bc4seed4/evaluation/generation/agg.4b284b21bc4seed4_gem_xsum_article_DOC_summary_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.12560830490871291, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0019805809749753123}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.30202505876515096, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004562458827775563}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.17393387340194993, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0026232973050223565}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.02632965637304347, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0010168079119372074}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.06654262996214515, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002628246685221607}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.03719404523373464, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0014264985251086694}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.09872111817099473, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0015538240912434773}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.23817398946563523, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0036574265400714056}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.1367280753200056, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0020569662559889986}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.10088738488275732, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0016123154477431468}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.24479219612186495, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0038858502767361853}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.13995698919988145, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0021562163365348155}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 1.5589813395856684, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.10558852439347298}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b21bc4seed4/evaluation/generation/agg.4b284b21bc4seed4_gem_xsum_article_DOC_summary_4.json b/4b284b21bc4seed4/evaluation/generation/agg.4b284b21bc4seed4_gem_xsum_article_DOC_summary_4.json new file mode 100644 index 0000000000000000000000000000000000000000..536c9f61d6d81cb5edf0dfade0ffc77f7e3c27c5 --- /dev/null +++ b/4b284b21bc4seed4/evaluation/generation/agg.4b284b21bc4seed4_gem_xsum_article_DOC_summary_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.039875289966317076, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0024501045936788945}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.07430021940128062, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004312735443842743}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.04714278099581509, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002671918175318051}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.00812289150475277, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0009151347143203979}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.016372857345750558, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0015796426861189893}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.009927038748098277, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0009411928436840111}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.031900774626537044, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0020006091032227793}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.058775527889088235, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0033989669828951557}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.03725830963733278, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0020970987843492487}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.03342763825361942, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.002105461480850086}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.06157534488712963, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.003610155719272957}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.03901707398161308, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0022151386053289395}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 0.7800465095373856, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.110140635740535}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b21bc4seed4/evaluation/generation/agg.4b284b21bc4seed4_gem_xsum_article_DOC_summary_5.json b/4b284b21bc4seed4/evaluation/generation/agg.4b284b21bc4seed4_gem_xsum_article_DOC_summary_5.json new file mode 100644 index 0000000000000000000000000000000000000000..124d9e526e17649e0eb60874357b548a4850dfc6 --- /dev/null +++ b/4b284b21bc4seed4/evaluation/generation/agg.4b284b21bc4seed4_gem_xsum_article_DOC_summary_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.0033882933420727682, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.000994288954345408}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.002780937524962328, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0007843603020955971}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.0030037230280197226, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0008566665942648847}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.001120152102248019, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0004966314099881747}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.0009065462839047746, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0004161603469287444}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.000983708450751863, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0004420715282406731}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.0026091624396139845, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0007993813642794688}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.002187358356350872, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0006548878815934947}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.002337297608841716, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0007032854409325233}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.0028561523161821077, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.000870682583927747}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.002361092427287286, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0006961516518425747}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.002540252346941857, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0007562653583340974}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 6.009065394749386e-37, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 1.386737757665829e-31}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b21bc4seed4/evaluation/generation/examples.4b284b21bc4seed4_GEM-web_nlg_en_PALM_prompt_0.jsonl b/4b284b21bc4seed4/evaluation/generation/examples.4b284b21bc4seed4_GEM-web_nlg_en_PALM_prompt_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..6199b16e220d6df95cf9944b39cc4b18d22ceeec --- /dev/null +++ b/4b284b21bc4seed4/evaluation/generation/examples.4b284b21bc4seed4_GEM-web_nlg_en_PALM_prompt_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7116ca8394e0b40ef4246ef90a305e8f338d5a81addf3e2b4d466c61cbbdc96 +size 4134740 diff --git a/4b284b21bc4seed4/evaluation/generation/examples.4b284b21bc4seed4_GEM-web_nlg_en_PALM_prompt_1.jsonl b/4b284b21bc4seed4/evaluation/generation/examples.4b284b21bc4seed4_GEM-web_nlg_en_PALM_prompt_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..0e8d1bfb4fc0c6a86e4523c6c6fd4388ed4246a3 --- /dev/null +++ b/4b284b21bc4seed4/evaluation/generation/examples.4b284b21bc4seed4_GEM-web_nlg_en_PALM_prompt_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b256c7bffd6f2ebb88ab5cb9c006cbdc6ec2afb40f6ee6cc7c313733c9e8ef11 +size 5116995 diff --git a/4b284b21bc4seed4/evaluation/generation/examples.4b284b21bc4seed4_GEM-web_nlg_en_PALM_prompt_2.jsonl b/4b284b21bc4seed4/evaluation/generation/examples.4b284b21bc4seed4_GEM-web_nlg_en_PALM_prompt_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..436bd6173e5c8efa933b7e5354eaa8cab0778213 --- /dev/null +++ b/4b284b21bc4seed4/evaluation/generation/examples.4b284b21bc4seed4_GEM-web_nlg_en_PALM_prompt_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a971348c6258021056650a1cdb0f13c60e2103ab5c4e169666a6c284263d6880 +size 6022132 diff --git a/4b284b21bc4seed4/evaluation/generation/examples.4b284b21bc4seed4_GEM-web_nlg_en_PALM_prompt_3.jsonl b/4b284b21bc4seed4/evaluation/generation/examples.4b284b21bc4seed4_GEM-web_nlg_en_PALM_prompt_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..b4a8219dc93e8b5e5012099e91c34cd464f978e5 --- /dev/null +++ b/4b284b21bc4seed4/evaluation/generation/examples.4b284b21bc4seed4_GEM-web_nlg_en_PALM_prompt_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d09d6dfb6fc3736c607432e9c36aeec2ff2b9601c76f45967eb0e4d92b68300 +size 6942145 diff --git a/4b284b21bc4seed4/evaluation/generation/examples.4b284b21bc4seed4_GEM-web_nlg_en_PALM_prompt_4.jsonl b/4b284b21bc4seed4/evaluation/generation/examples.4b284b21bc4seed4_GEM-web_nlg_en_PALM_prompt_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..499c9b06e410560af5acf82e1ecd1e67660168f4 --- /dev/null +++ b/4b284b21bc4seed4/evaluation/generation/examples.4b284b21bc4seed4_GEM-web_nlg_en_PALM_prompt_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27091cb8ade9a0095b4e0410c1c8f1f179a9b377e9101674bed06772c9a28003 +size 7856422 diff --git a/4b284b21bc4seed4/evaluation/generation/examples.4b284b21bc4seed4_GEM-web_nlg_en_PALM_prompt_5.jsonl b/4b284b21bc4seed4/evaluation/generation/examples.4b284b21bc4seed4_GEM-web_nlg_en_PALM_prompt_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..1b81797b159c478a2492618920e0fa1ed0a247d9 --- /dev/null +++ b/4b284b21bc4seed4/evaluation/generation/examples.4b284b21bc4seed4_GEM-web_nlg_en_PALM_prompt_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f19d9f536ae74eb819f2da05cd451024f519565a919776b9b5e75eb55b2e7a7 +size 8768681 diff --git a/4b284b21bc4seed4/evaluation/generation/examples.4b284b21bc4seed4_GEM-wiki_lingua_en_tldr_en_0.jsonl b/4b284b21bc4seed4/evaluation/generation/examples.4b284b21bc4seed4_GEM-wiki_lingua_en_tldr_en_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..6307a983ab4d0900d471b002a5250659a9be02aa --- /dev/null +++ b/4b284b21bc4seed4/evaluation/generation/examples.4b284b21bc4seed4_GEM-wiki_lingua_en_tldr_en_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97b975ef2d3cb52f63212a3603cc7eba7e618fe28634751d5092616f483834d9 +size 7705113 diff --git a/4b284b21bc4seed4/evaluation/generation/examples.4b284b21bc4seed4_GEM-wiki_lingua_en_tldr_en_1.jsonl b/4b284b21bc4seed4/evaluation/generation/examples.4b284b21bc4seed4_GEM-wiki_lingua_en_tldr_en_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..95aa42caa9e453eab2664b4c8d54f80e7c0f1396 --- /dev/null +++ b/4b284b21bc4seed4/evaluation/generation/examples.4b284b21bc4seed4_GEM-wiki_lingua_en_tldr_en_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:16b0ccc9a49943d0758752b9d70f66c94d59a4bd63504a28046e7a7e4eeeae30 +size 13327650 diff --git a/4b284b21bc4seed4/evaluation/generation/examples.4b284b21bc4seed4_GEM-wiki_lingua_en_tldr_en_2.jsonl b/4b284b21bc4seed4/evaluation/generation/examples.4b284b21bc4seed4_GEM-wiki_lingua_en_tldr_en_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..833c1205143da79199e0407fad2d80e60810c709 --- /dev/null +++ b/4b284b21bc4seed4/evaluation/generation/examples.4b284b21bc4seed4_GEM-wiki_lingua_en_tldr_en_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:60104c91055808be224576927e1fe09c82f65d3cca16b49d9fce9d6b4cc7739b +size 18923008 diff --git a/4b284b21bc4seed4/evaluation/generation/examples.4b284b21bc4seed4_GEM-wiki_lingua_en_tldr_en_3.jsonl b/4b284b21bc4seed4/evaluation/generation/examples.4b284b21bc4seed4_GEM-wiki_lingua_en_tldr_en_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..a4ea687567843ad1b37afd0c74d6b8a15e06c0a3 --- /dev/null +++ b/4b284b21bc4seed4/evaluation/generation/examples.4b284b21bc4seed4_GEM-wiki_lingua_en_tldr_en_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8a2fcf09b7c5e8075a8aa8804b4e02fb61abe1365b4982ed0f8770fc8a5211e +size 24326604 diff --git a/4b284b21bc4seed4/evaluation/generation/examples.4b284b21bc4seed4_GEM-wiki_lingua_en_tldr_en_4.jsonl b/4b284b21bc4seed4/evaluation/generation/examples.4b284b21bc4seed4_GEM-wiki_lingua_en_tldr_en_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..07ca4415ea07f45a0ff434aefb70755e66ee36b8 --- /dev/null +++ b/4b284b21bc4seed4/evaluation/generation/examples.4b284b21bc4seed4_GEM-wiki_lingua_en_tldr_en_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6af86393cc761e6bd3b455da7c045591e434635b1f4e286c746e430193eefb5f +size 29469079 diff --git a/4b284b21bc4seed4/evaluation/generation/examples.4b284b21bc4seed4_GEM-wiki_lingua_en_tldr_en_5.jsonl b/4b284b21bc4seed4/evaluation/generation/examples.4b284b21bc4seed4_GEM-wiki_lingua_en_tldr_en_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..43632dd5f5d4cba1e9cef1bf2465de9338094b65 --- /dev/null +++ b/4b284b21bc4seed4/evaluation/generation/examples.4b284b21bc4seed4_GEM-wiki_lingua_en_tldr_en_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b8275a77bb464adf5e1af85ff125bbc5bc258a30b77be53411b16c4248da1aa +size 34799892 diff --git a/4b284b21bc4seed4/evaluation/generation/examples.4b284b21bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl b/4b284b21bc4seed4/evaluation/generation/examples.4b284b21bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..86f07b49318e57f7c50c5604058acddcbf2ae9f2 --- /dev/null +++ b/4b284b21bc4seed4/evaluation/generation/examples.4b284b21bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3189c3d1461a62bf3c1b6d81754a120b18c1995bd59129ca95bec4f8c9604b2b +size 4420695 diff --git a/4b284b21bc4seed4/evaluation/generation/examples.4b284b21bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl b/4b284b21bc4seed4/evaluation/generation/examples.4b284b21bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..6cf9678dd4aa75c79e02da4dd0e179dbbdb7c517 --- /dev/null +++ b/4b284b21bc4seed4/evaluation/generation/examples.4b284b21bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c128c90b3a524940d4bb807714f38c7714157acffcdf074c63f201a787f3145a +size 5496198 diff --git a/4b284b21bc4seed4/evaluation/generation/examples.4b284b21bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl b/4b284b21bc4seed4/evaluation/generation/examples.4b284b21bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..6b51b2b919209d1be87e1f0ed88afc5836761cbd --- /dev/null +++ b/4b284b21bc4seed4/evaluation/generation/examples.4b284b21bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:492d052b9b1a1783bb9efcc8a9e8a7619d5cc1b4e9a48780782047d53219cbc6 +size 6400193 diff --git a/4b284b21bc4seed4/evaluation/generation/examples.4b284b21bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl b/4b284b21bc4seed4/evaluation/generation/examples.4b284b21bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..643476a17f9fa8c706e47366f776e5bdc32c91db --- /dev/null +++ b/4b284b21bc4seed4/evaluation/generation/examples.4b284b21bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e865dbf3d2fe3c1e7dc3af47b37ecccc4fbcf320a1fa619410b4eaf0e30c0926 +size 7357952 diff --git a/4b284b21bc4seed4/evaluation/generation/examples.4b284b21bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl b/4b284b21bc4seed4/evaluation/generation/examples.4b284b21bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..5286460c71d240dfbcdb7747fdcf7603ef839d0a --- /dev/null +++ b/4b284b21bc4seed4/evaluation/generation/examples.4b284b21bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:41522feb72bf9525430367476b1a37743e28ea60758261f92450cdd2f8f60816 +size 8412249 diff --git a/4b284b21bc4seed4/evaluation/generation/examples.4b284b21bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl b/4b284b21bc4seed4/evaluation/generation/examples.4b284b21bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..746c494030a42040d31ed6505b6db9e1cb1cd876 --- /dev/null +++ b/4b284b21bc4seed4/evaluation/generation/examples.4b284b21bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:69e5e36dbc5f3ab3fac1b47194c515640dacb842fac3ddad83848446b3a82bf5 +size 9504276 diff --git a/4b284b21bc4seed4/evaluation/generation/examples.4b284b21bc4seed4_gem_xsum_article_DOC_summary_0.jsonl b/4b284b21bc4seed4/evaluation/generation/examples.4b284b21bc4seed4_gem_xsum_article_DOC_summary_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e30c3ac3f9afd61b2ff416a553b44a7c430fd89c --- /dev/null +++ b/4b284b21bc4seed4/evaluation/generation/examples.4b284b21bc4seed4_gem_xsum_article_DOC_summary_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f434e2c23bf88e366c9f50808dceb975251bd71203026fa65847881705d85a34 +size 2791496 diff --git a/4b284b21bc4seed4/evaluation/generation/examples.4b284b21bc4seed4_gem_xsum_article_DOC_summary_1.jsonl b/4b284b21bc4seed4/evaluation/generation/examples.4b284b21bc4seed4_gem_xsum_article_DOC_summary_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..3f285966f8a1265bf8a0816ba23152dbff1d8078 --- /dev/null +++ b/4b284b21bc4seed4/evaluation/generation/examples.4b284b21bc4seed4_gem_xsum_article_DOC_summary_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:970cff07f46e99aa88f9bc1639442847bb088363adeda9a0eea342eb85eaab25 +size 5100828 diff --git a/4b284b21bc4seed4/evaluation/generation/examples.4b284b21bc4seed4_gem_xsum_article_DOC_summary_2.jsonl b/4b284b21bc4seed4/evaluation/generation/examples.4b284b21bc4seed4_gem_xsum_article_DOC_summary_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..5251388b2511bc848b39c933cf378fbcabbf94b5 --- /dev/null +++ b/4b284b21bc4seed4/evaluation/generation/examples.4b284b21bc4seed4_gem_xsum_article_DOC_summary_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd1ab0bcdad719d3fb426f579d739196293cc5a452552b7844940b1d9bb86413 +size 7375759 diff --git a/4b284b21bc4seed4/evaluation/generation/examples.4b284b21bc4seed4_gem_xsum_article_DOC_summary_3.jsonl b/4b284b21bc4seed4/evaluation/generation/examples.4b284b21bc4seed4_gem_xsum_article_DOC_summary_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..0a727ca0ec1f544f5748d10b1fbd795c8b48904b --- /dev/null +++ b/4b284b21bc4seed4/evaluation/generation/examples.4b284b21bc4seed4_gem_xsum_article_DOC_summary_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e1b2d565fad3e80107fb423c8a82ec148a9cac67fef4b16ad0a37da24b150f80 +size 9643048 diff --git a/4b284b21bc4seed4/evaluation/generation/examples.4b284b21bc4seed4_gem_xsum_article_DOC_summary_4.jsonl b/4b284b21bc4seed4/evaluation/generation/examples.4b284b21bc4seed4_gem_xsum_article_DOC_summary_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..323b873d7c182fde76acd0aa78eadf30e4711cc2 --- /dev/null +++ b/4b284b21bc4seed4/evaluation/generation/examples.4b284b21bc4seed4_gem_xsum_article_DOC_summary_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7cb26d1161683efeb407cade6e76a91123c6e88f946ea5453d6a5912978c37e8 +size 11671282 diff --git a/4b284b21bc4seed4/evaluation/generation/examples.4b284b21bc4seed4_gem_xsum_article_DOC_summary_5.jsonl b/4b284b21bc4seed4/evaluation/generation/examples.4b284b21bc4seed4_gem_xsum_article_DOC_summary_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..739b4dd546ca33665de2e758680f37359f25735e --- /dev/null +++ b/4b284b21bc4seed4/evaluation/generation/examples.4b284b21bc4seed4_gem_xsum_article_DOC_summary_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6815a540ba94104cf1af3df82a11e7fd8b53c7a18051622655267d938cd25a07 +size 13897571 diff --git a/4b284b21bc4seed4/evaluation/generation/slim.4b284b21bc4seed4_GEM-web_nlg_en_PALM_prompt_0.json b/4b284b21bc4seed4/evaluation/generation/slim.4b284b21bc4seed4_GEM-web_nlg_en_PALM_prompt_0.json new file mode 100644 index 0000000000000000000000000000000000000000..e12ee97e7cabab024503a5a8a83f97f8f674223b --- /dev/null +++ b/4b284b21bc4seed4/evaluation/generation/slim.4b284b21bc4seed4_GEM-web_nlg_en_PALM_prompt_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.3751221736027223, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.04603981713785397 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.07050754951097193, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0015950749741378038 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.2930621241248632, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0047039720667729585 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.10655282549139757, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.002069892427617646 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.03327005966333133, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0009772300003902292 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.14224611225552608, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0031500776280318555 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.05052209059024575, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0012866888304456589 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.0677233404229661, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0014833039402630307 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.28507940697548506, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004611898165464154 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.10267935520945128, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0019389896303185993 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.06739541442277049, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0015164320427077738 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.27995528365978256, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004446276996131344 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.10179374812954574, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0019553887116743455 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b21bc4seed4/evaluation/generation/slim.4b284b21bc4seed4_GEM-web_nlg_en_PALM_prompt_1.json b/4b284b21bc4seed4/evaluation/generation/slim.4b284b21bc4seed4_GEM-web_nlg_en_PALM_prompt_1.json new file mode 100644 index 0000000000000000000000000000000000000000..70dcba0c350878ff4cfee8da17cd341054fb11be --- /dev/null +++ b/4b284b21bc4seed4/evaluation/generation/slim.4b284b21bc4seed4_GEM-web_nlg_en_PALM_prompt_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.5198830574890386, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.03504017360483535 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.07738811110777072, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0015304988936609128 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.3862577997016925, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.00572058610283539 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.12070700921084229, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.002002150459250641 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.03507152315512706, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0008467381062339321 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.18709836433905874, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.003833792467120382 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.05531307099139748, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0012137549494064656 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.07158564602943736, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0013356095688320767 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.3620899416623159, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.005273165348503305 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.11194710382233043, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0017263614451165634 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.07309280304036243, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0014294724139865343 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.36442715703356776, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.005241997303110117 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.11393170029640054, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0018446583441229345 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b21bc4seed4/evaluation/generation/slim.4b284b21bc4seed4_GEM-web_nlg_en_PALM_prompt_2.json b/4b284b21bc4seed4/evaluation/generation/slim.4b284b21bc4seed4_GEM-web_nlg_en_PALM_prompt_2.json new file mode 100644 index 0000000000000000000000000000000000000000..602efbe78522b1faae2a46e25ea8763006de6dca --- /dev/null +++ b/4b284b21bc4seed4/evaluation/generation/slim.4b284b21bc4seed4_GEM-web_nlg_en_PALM_prompt_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.5772980788839762, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.0351401276773091 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.07813906472896695, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0013627013823755202 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.4101295780853266, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.005693087311032938 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.12373316030300299, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0018974475884765722 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.03581354421318794, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0008022617515173707 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.2032111746093155, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.003954708803559 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.0570319859750151, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0011521977790571885 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.07158825167996366, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0011655724191791303 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.3794140508633469, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.005145968326494213 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.11350896035348979, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0016169887067107285 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.07387016720939305, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0012627844516927061 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.38737624946784815, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.005248864126942714 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.11690863992503238, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0017500511668341343 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b21bc4seed4/evaluation/generation/slim.4b284b21bc4seed4_GEM-web_nlg_en_PALM_prompt_3.json b/4b284b21bc4seed4/evaluation/generation/slim.4b284b21bc4seed4_GEM-web_nlg_en_PALM_prompt_3.json new file mode 100644 index 0000000000000000000000000000000000000000..9209bc941d56ac67a1d0216fb570649183e16983 --- /dev/null +++ b/4b284b21bc4seed4/evaluation/generation/slim.4b284b21bc4seed4_GEM-web_nlg_en_PALM_prompt_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.6456226857113138, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.040165536189754096 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.0778881396479436, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0012769567386518232 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.42296024366383517, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.00569044382493207 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.12436437584313036, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.001814950124577219 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.03521828535740504, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0007298691703855176 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.20809711310932535, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.003931907827643346 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.05661337603042263, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.001071749411178637 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.07076272874827239, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0011113411679509696 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.3866270125315969, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.005107912406441445 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.11292204203780767, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0015573442585516018 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.0732788083787352, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0011890321940136864 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.39617638119143006, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0051662731631678 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.1168466330708585, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0016763512625120776 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b21bc4seed4/evaluation/generation/slim.4b284b21bc4seed4_GEM-web_nlg_en_PALM_prompt_4.json b/4b284b21bc4seed4/evaluation/generation/slim.4b284b21bc4seed4_GEM-web_nlg_en_PALM_prompt_4.json new file mode 100644 index 0000000000000000000000000000000000000000..f63adfe403eed09eb67b483c076d9a7e2e5db595 --- /dev/null +++ b/4b284b21bc4seed4/evaluation/generation/slim.4b284b21bc4seed4_GEM-web_nlg_en_PALM_prompt_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.7394949248334012, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.0375339718418186 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.07935954064608862, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0012440228309059662 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.44189075126537175, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0056160164221400995 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.12719292338738244, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0017548996669778086 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.03609299322498633, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0007391134009433947 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.21980568290237434, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.004020542118197972 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.058223377247645175, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.001073250860654579 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.07145742950585998, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0010699196551391536 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.3991369324047731, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0049417529681389525 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.1144359922322097, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0014869489906081234 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.07454021703025861, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0011655709781687874 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.41368909933661674, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.005127640598028314 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.11931787390462796, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0016294893480413802 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b21bc4seed4/evaluation/generation/slim.4b284b21bc4seed4_GEM-web_nlg_en_PALM_prompt_5.json b/4b284b21bc4seed4/evaluation/generation/slim.4b284b21bc4seed4_GEM-web_nlg_en_PALM_prompt_5.json new file mode 100644 index 0000000000000000000000000000000000000000..7fcdac4161823a30190c01f1e1f8e009c5a79fcb --- /dev/null +++ b/4b284b21bc4seed4/evaluation/generation/slim.4b284b21bc4seed4_GEM-web_nlg_en_PALM_prompt_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.7350884275632563, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.04285525370548216 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.07963440574460627, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0012450999827039412 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.450750421306443, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.005688854042032203 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.12790081410584203, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.001762758952960184 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.03626337631746513, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0007247188269312321 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.22702405178339297, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.004195235523736308 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.058684632135392434, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0010628257100155462 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.07125643393688096, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.00105707615542693 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.4063747251874938, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.005069676186964856 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.11440641190075858, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0014753694031490337 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.07452930873504321, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0011537233047546483 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.42116829387113064, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.005204895411040752 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.11957698534047122, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0016217012306438583 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b21bc4seed4/evaluation/generation/slim.4b284b21bc4seed4_GEM-wiki_lingua_en_tldr_en_0.json b/4b284b21bc4seed4/evaluation/generation/slim.4b284b21bc4seed4_GEM-wiki_lingua_en_tldr_en_0.json new file mode 100644 index 0000000000000000000000000000000000000000..337d1377704e551f27b1773e08140e62a9c04f35 --- /dev/null +++ b/4b284b21bc4seed4/evaluation/generation/slim.4b284b21bc4seed4_GEM-wiki_lingua_en_tldr_en_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.15229529499726693, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0018532935787449235 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.2584223718261279, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0025516613510239644 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.17846806393672296, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0018156572490314613 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.030189999709011046, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0007527178027814116 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.05276107785013939, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0013537005512275853 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.035498190179559366, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0008425007414760624 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.11790693896267036, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.001294367886229787 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.20826559324975696, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0020968023223764095 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.13992548854671796, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0012925170885687428 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.1388827214194179, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0016844636725997805 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.2370411466342553, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.002357902527598024 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.16300806309885615, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0016517242441511555 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 1.5445764212442845, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.046348567423538295 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b21bc4seed4/evaluation/generation/slim.4b284b21bc4seed4_GEM-wiki_lingua_en_tldr_en_1.json b/4b284b21bc4seed4/evaluation/generation/slim.4b284b21bc4seed4_GEM-wiki_lingua_en_tldr_en_1.json new file mode 100644 index 0000000000000000000000000000000000000000..52e2cb0efd9e2716987ef010bfa1109899d1fe65 --- /dev/null +++ b/4b284b21bc4seed4/evaluation/generation/slim.4b284b21bc4seed4_GEM-wiki_lingua_en_tldr_en_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.19660419529835046, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0021703512663018435 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.33305075642202464, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0027422057559937344 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.22871763440008758, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0019504250194142293 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.048646612266404474, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0010079743018688542 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.08571356139913104, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0017928353996558705 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.056810181676750955, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0010692773805419653 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.13473919020916866, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0014138439503997033 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.2377264850157444, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0022081866868395457 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.1584532961497466, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0012813295440813953 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.18408931555378133, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0020314434795525877 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.3130915982176866, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.002608677189171684 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.21440206759227748, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0018298647451743082 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 2.9354736259244234, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.08184998217131226 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b21bc4seed4/evaluation/generation/slim.4b284b21bc4seed4_GEM-wiki_lingua_en_tldr_en_2.json b/4b284b21bc4seed4/evaluation/generation/slim.4b284b21bc4seed4_GEM-wiki_lingua_en_tldr_en_2.json new file mode 100644 index 0000000000000000000000000000000000000000..e178fd80fffd3d06f9e0ec0aa51d684413e06177 --- /dev/null +++ b/4b284b21bc4seed4/evaluation/generation/slim.4b284b21bc4seed4_GEM-wiki_lingua_en_tldr_en_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.19308251629949974, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0021372296672672315 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.3226572993341573, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.002715283947112145 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.2216752304780583, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0018496410521841634 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.04755808223353882, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.001056965112675896 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.08157607236301773, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0016928843275132437 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.05419402589748163, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0010092487989924672 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.13475955724902108, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0015213837884005157 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.23151769344902068, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.002143281502769755 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.15534336307223465, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0012446244313757237 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.18213738467572518, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0020147435204007475 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.3053278835262653, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0025811768541287375 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.2092469074780288, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0017297088792391818 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 2.988336179481119, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.07284534182808335 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b21bc4seed4/evaluation/generation/slim.4b284b21bc4seed4_GEM-wiki_lingua_en_tldr_en_3.json b/4b284b21bc4seed4/evaluation/generation/slim.4b284b21bc4seed4_GEM-wiki_lingua_en_tldr_en_3.json new file mode 100644 index 0000000000000000000000000000000000000000..5bbb3afc063d70093616285de2e8adb81023242f --- /dev/null +++ b/4b284b21bc4seed4/evaluation/generation/slim.4b284b21bc4seed4_GEM-wiki_lingua_en_tldr_en_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.16818607657817242, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.002571340600589284 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.2618591281994728, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0033215062620397654 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.18235828185303843, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0022330522398271444 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.039906055320126824, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0011176532929901056 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.06504905939729995, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0016338067696316037 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.04352751746326409, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.000986420480404656 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.11910589220232795, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.001919539273889145 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.18906464586111238, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.002550157025960148 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.12850084937451378, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0015346657748469231 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.1592819269786109, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0024458047067507224 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.24869687852492026, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.00317986279337076 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.17275184259901263, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0021141809407287217 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 2.955313094852994, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.0766356215689601 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b21bc4seed4/evaluation/generation/slim.4b284b21bc4seed4_GEM-wiki_lingua_en_tldr_en_4.json b/4b284b21bc4seed4/evaluation/generation/slim.4b284b21bc4seed4_GEM-wiki_lingua_en_tldr_en_4.json new file mode 100644 index 0000000000000000000000000000000000000000..6be6bfaeb631e7643e3893da3e81fced56471a5d --- /dev/null +++ b/4b284b21bc4seed4/evaluation/generation/slim.4b284b21bc4seed4_GEM-wiki_lingua_en_tldr_en_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.05651284854563454, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.002164889280586853 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.08771427792659671, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.003046668032178251 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.0587450878634487, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.001987849748246455 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.01373423070578025, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0007944242550989159 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.023902876010557156, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0012871698398313374 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.014698951085450463, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0007071025730658953 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.041455127649633716, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.001604158922614608 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.06565381938564946, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.002338953948684061 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.04283521055248602, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.001420656788711465 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.053065857077570854, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0020380922902812288 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.08260798722441874, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.002886226452230474 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.05516099966060376, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0018676755144161564 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 0.6681174311441812, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.044021606714169687 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b21bc4seed4/evaluation/generation/slim.4b284b21bc4seed4_GEM-wiki_lingua_en_tldr_en_5.json b/4b284b21bc4seed4/evaluation/generation/slim.4b284b21bc4seed4_GEM-wiki_lingua_en_tldr_en_5.json new file mode 100644 index 0000000000000000000000000000000000000000..61b20391d47452037e19fce1dd89713515606307 --- /dev/null +++ b/4b284b21bc4seed4/evaluation/generation/slim.4b284b21bc4seed4_GEM-wiki_lingua_en_tldr_en_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.008744552174562775, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0008820534430831269 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.014063870074080958, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0013626675606431993 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.009157992753346606, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.000856510665924713 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.001867598511771763, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0002589055645534681 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.0037526556188222397, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0005665830894881638 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.002073109168721178, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.00025579423912383813 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.006278467313776165, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0006318463479225579 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.010544788230721835, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0010639298188298192 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.006597140236099842, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0006134117940431641 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.00823467650006455, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.000829000231276819 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.013318449806788014, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0012936214066513207 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.008602211224573027, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0007971656716790751 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 8.138411373037316e-07, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 1.7429365149014433e-06 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b21bc4seed4/evaluation/generation/slim.4b284b21bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_0.json b/4b284b21bc4seed4/evaluation/generation/slim.4b284b21bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_0.json new file mode 100644 index 0000000000000000000000000000000000000000..f33a05ed4ead022034cc308fa632f372d8562b32 --- /dev/null +++ b/4b284b21bc4seed4/evaluation/generation/slim.4b284b21bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 0.1675172437507659, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.027600643399440884 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.028701737940994714, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0010195754285503126 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.02982766113489123, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0008471594561940423 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.024088126860004336, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0006566077823850723 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.0015626210476206773, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0003728911300811695 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.0014347430615192808, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.00023769294132393532 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.001114996015022125, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.00018328608469909375 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.028417386089142856, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0009947648295870358 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.029685273969587405, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.00083480831932383 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.023944632138488853, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0006463198681447033 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.02728685295948081, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0009885875546693994 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.02727004908623676, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0007114664570306672 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.022309991073370505, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0005760998972707722 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b21bc4seed4/evaluation/generation/slim.4b284b21bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_1.json b/4b284b21bc4seed4/evaluation/generation/slim.4b284b21bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_1.json new file mode 100644 index 0000000000000000000000000000000000000000..a1d979ff88d0b3a1ea5337ae3e4923b862fb4845 --- /dev/null +++ b/4b284b21bc4seed4/evaluation/generation/slim.4b284b21bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 5.8311861735166675, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.06388138684732117 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.2601081962246765, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0021349255671127927 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.4686781469942304, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.002825480648369596 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.3211813837867464, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.002018437643374035 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.10907314684339463, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0013682678699487114 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.1992897827723483, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0021146365213576476 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.13429472916574672, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0014217210935365725 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.2056686183422757, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0015071237696962308 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.37982651296992087, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0023920704305803887 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.25612256110358006, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0014268806319662325 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.2117404050410904, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0019554275881996357 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.379262023761823, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0026640542361163967 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.2605843619987691, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0019094298729220246 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b21bc4seed4/evaluation/generation/slim.4b284b21bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_2.json b/4b284b21bc4seed4/evaluation/generation/slim.4b284b21bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_2.json new file mode 100644 index 0000000000000000000000000000000000000000..22149b9cc8177d7102d14fc7e79a1b4fe023b45a --- /dev/null +++ b/4b284b21bc4seed4/evaluation/generation/slim.4b284b21bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 8.283032143741265, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.12324083863995262 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.3538185229938564, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0026093673205933284 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.47654923761453416, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.002742670643307486 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.386855872645816, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0021481774383948936 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.16058763409752866, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0017929892307175898 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.2186758841759895, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0021644223522511653 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.17540917102638537, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.001676199795834029 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.2634180709043917, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0019363360461210728 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.3633286847976612, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.002418760103075258 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.29032162387497273, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0016448424366105137 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.2943420649549215, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0024049285177976626 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.396021431067016, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0026539511959613863 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.3215658810211159, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0020865232232060243 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b21bc4seed4/evaluation/generation/slim.4b284b21bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_3.json b/4b284b21bc4seed4/evaluation/generation/slim.4b284b21bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_3.json new file mode 100644 index 0000000000000000000000000000000000000000..cc7948939d160bc7497eb190962574f56cc27e22 --- /dev/null +++ b/4b284b21bc4seed4/evaluation/generation/slim.4b284b21bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 10.390741038004455, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.16864807456665598 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.4170328570049967, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.002406804998864227 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.4755330496164165, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0027356944570645627 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.4265219434574998, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.00200022371619217 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.19311277752964032, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0018435166685741753 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.2234558315509727, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.00217671447753381 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.19794956049387477, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0017257612820525093 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.3018404766668879, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0019954675660840008 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.34733784496925735, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.002410859115489849 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.30937209897451035, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0017399874604572011 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.34804273669533864, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.002320309559338597 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.39674483976023345, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.002636069670789193 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.35577353404582346, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.002018349673780584 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b21bc4seed4/evaluation/generation/slim.4b284b21bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_4.json b/4b284b21bc4seed4/evaluation/generation/slim.4b284b21bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_4.json new file mode 100644 index 0000000000000000000000000000000000000000..10251aa1748149c09ae2e255e28ee286442d2e33 --- /dev/null +++ b/4b284b21bc4seed4/evaluation/generation/slim.4b284b21bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 11.329341641449828, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.17960715134758612 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.43540537755676456, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0023276114946809037 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.4809839727831288, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0026909272047918853 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.4404396724578438, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0019501997658908016 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.20335070986022913, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0018630249723704795 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.2277953855378017, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.002231447665036813 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.20632107444632167, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0017999776378623833 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.31052804922692206, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0019906703253583058 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.34538706806048836, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0024265779869813795 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.3146665867607543, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.001793539263470212 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.36360422785078816, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.002278768446357271 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.40267975309659465, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.002691014459855529 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.3681598682721843, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0020492701030304073 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b21bc4seed4/evaluation/generation/slim.4b284b21bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_5.json b/4b284b21bc4seed4/evaluation/generation/slim.4b284b21bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_5.json new file mode 100644 index 0000000000000000000000000000000000000000..ac6afbed6be51560bfdfb80150e281e7ee76841b --- /dev/null +++ b/4b284b21bc4seed4/evaluation/generation/slim.4b284b21bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 11.285255750718802, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.18888005349774178 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.4365680288096621, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0023563761935207865 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.48375423799463574, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.002636920734911192 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.4415151553259178, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0018967405556148942 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.2041613364300487, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0018478653045982886 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.2286562929012743, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0021444262626903934 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.20666903463506434, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0017287346978560685 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.3097317177052037, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0019875430217516188 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.3463247383671021, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0024086631359451073 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.31404489497308175, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0017489740232863793 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.36511129451802127, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.002275854131726726 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.40524349161687195, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.002592210635732001 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.3693839714597318, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.001956221447002133 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b21bc4seed4/evaluation/generation/slim.4b284b21bc4seed4_gem_xsum_article_DOC_summary_0.json b/4b284b21bc4seed4/evaluation/generation/slim.4b284b21bc4seed4_gem_xsum_article_DOC_summary_0.json new file mode 100644 index 0000000000000000000000000000000000000000..4faf90c9953a2471a098878e78691e7c5ffe3893 --- /dev/null +++ b/4b284b21bc4seed4/evaluation/generation/slim.4b284b21bc4seed4_gem_xsum_article_DOC_summary_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.16661991011320432, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0024239320503688508 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.3334279529769119, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.004505784466073162 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.21238019045835924, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0026416842263647295 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.036458947908946444, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0013971876206545527 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.07797973705513334, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0027575216878305796 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.0474651150579007, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0016508808672473486 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.12350643841301835, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0018449748802517576 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.24834266376447475, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0034694940835095387 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.1574172507962458, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0019726023490667156 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.12930576998616114, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.001943629127681205 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.2628771358874318, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.003928661472441744 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.16564203891769072, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0021922015182424493 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 1.9920111933130942, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.09083971543338792 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b21bc4seed4/evaluation/generation/slim.4b284b21bc4seed4_gem_xsum_article_DOC_summary_1.json b/4b284b21bc4seed4/evaluation/generation/slim.4b284b21bc4seed4_gem_xsum_article_DOC_summary_1.json new file mode 100644 index 0000000000000000000000000000000000000000..504387ad2cc49f7c84ed97a2ad19e815964321ae --- /dev/null +++ b/4b284b21bc4seed4/evaluation/generation/slim.4b284b21bc4seed4_gem_xsum_article_DOC_summary_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.12220764132281824, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0017962553489656822 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.3046016264780442, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.004195472170007382 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.17238543114114188, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0024273582171495467 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.02404240814314951, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0009715966898615973 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.06279570551371068, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0026393784630938297 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.03433659588366439, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0013916698462749025 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.0948627092015581, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0013564109394382858 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.23873232992980792, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0033732063257411065 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.13411490255282393, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.001857806891825946 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.09744320598123982, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0014533168661689533 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.24526431304855986, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0036135020193240157 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.1377971067717085, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0019961553438677753 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 1.3911048134042985, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.10897719788542379 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b21bc4seed4/evaluation/generation/slim.4b284b21bc4seed4_gem_xsum_article_DOC_summary_2.json b/4b284b21bc4seed4/evaluation/generation/slim.4b284b21bc4seed4_gem_xsum_article_DOC_summary_2.json new file mode 100644 index 0000000000000000000000000000000000000000..8f7c333e1ca05664edb1d27d8ce8af8180154c89 --- /dev/null +++ b/4b284b21bc4seed4/evaluation/generation/slim.4b284b21bc4seed4_gem_xsum_article_DOC_summary_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.12742301658282565, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0018019437038001125 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.31650559447584714, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.0041632693268193 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.1796260802555828, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0024295120173709354 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.026873267786760833, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0010274689542246274 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.06937748072287012, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.002720274634345644 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.03828129617404584, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0014588717099132717 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.09972086437810422, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0013615528035081867 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.25006918430896163, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0033224978911440477 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.14088593992593365, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0018545171064126879 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.10228150708865971, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.001498292749384224 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.2564975734365291, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.003645659171226953 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.14453096950758154, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0020492721061134787 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 1.5131027243134945, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.09818604218520245 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b21bc4seed4/evaluation/generation/slim.4b284b21bc4seed4_gem_xsum_article_DOC_summary_3.json b/4b284b21bc4seed4/evaluation/generation/slim.4b284b21bc4seed4_gem_xsum_article_DOC_summary_3.json new file mode 100644 index 0000000000000000000000000000000000000000..e4213d253c482d202ba5fc7103cfa888a2495f6d --- /dev/null +++ b/4b284b21bc4seed4/evaluation/generation/slim.4b284b21bc4seed4_gem_xsum_article_DOC_summary_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.12560830490871291, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0019805809749753123 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.30202505876515096, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.004562458827775563 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.17393387340194993, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0026232973050223565 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.02632965637304347, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0010168079119372074 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.06654262996214515, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.002628246685221607 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.03719404523373464, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0014264985251086694 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.09872111817099473, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0015538240912434773 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.23817398946563523, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0036574265400714056 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.1367280753200056, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0020569662559889986 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.10088738488275732, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0016123154477431468 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.24479219612186495, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0038858502767361853 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.13995698919988145, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0021562163365348155 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 1.5589813395856684, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.10558852439347298 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b21bc4seed4/evaluation/generation/slim.4b284b21bc4seed4_gem_xsum_article_DOC_summary_4.json b/4b284b21bc4seed4/evaluation/generation/slim.4b284b21bc4seed4_gem_xsum_article_DOC_summary_4.json new file mode 100644 index 0000000000000000000000000000000000000000..b733831c3aa57647dff628a84aa1aaf4278a7747 --- /dev/null +++ b/4b284b21bc4seed4/evaluation/generation/slim.4b284b21bc4seed4_gem_xsum_article_DOC_summary_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.039875289966317076, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0024501045936788945 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.07430021940128062, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.004312735443842743 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.04714278099581509, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.002671918175318051 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.00812289150475277, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0009151347143203979 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.016372857345750558, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0015796426861189893 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.009927038748098277, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0009411928436840111 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.031900774626537044, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0020006091032227793 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.058775527889088235, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0033989669828951557 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.03725830963733278, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0020970987843492487 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.03342763825361942, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.002105461480850086 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.06157534488712963, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.003610155719272957 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.03901707398161308, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0022151386053289395 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 0.7800465095373856, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.110140635740535 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b21bc4seed4/evaluation/generation/slim.4b284b21bc4seed4_gem_xsum_article_DOC_summary_5.json b/4b284b21bc4seed4/evaluation/generation/slim.4b284b21bc4seed4_gem_xsum_article_DOC_summary_5.json new file mode 100644 index 0000000000000000000000000000000000000000..a5dbde9b0e42f22322b6f8c16e9842b92c18811f --- /dev/null +++ b/4b284b21bc4seed4/evaluation/generation/slim.4b284b21bc4seed4_gem_xsum_article_DOC_summary_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.0033882933420727682, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.000994288954345408 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.002780937524962328, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.0007843603020955971 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.0030037230280197226, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0008566665942648847 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.001120152102248019, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0004966314099881747 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.0009065462839047746, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0004161603469287444 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.000983708450751863, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0004420715282406731 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.0026091624396139845, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0007993813642794688 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.002187358356350872, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0006548878815934947 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.002337297608841716, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0007032854409325233 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.0028561523161821077, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.000870682583927747 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.002361092427287286, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0006961516518425747 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.002540252346941857, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0007562653583340974 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 6.009065394749386e-37, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 1.386737757665829e-31 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b21bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b21bc4seed4/evaluation/rankeval/4b284b21bc4seed4_0.json b/4b284b21bc4seed4/evaluation/rankeval/4b284b21bc4seed4_0.json new file mode 100644 index 0000000000000000000000000000000000000000..b9289ba3c5da01629517bfcd7e976af53abfcbfd --- /dev/null +++ b/4b284b21bc4seed4/evaluation/rankeval/4b284b21bc4seed4_0.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.324, + "acc_stderr": 0.014806864733738859 + }, + "anli_r2": { + "acc": 0.338, + "acc_stderr": 0.014965960710224482 + }, + "anli_r3": { + "acc": 0.3416666666666667, + "acc_stderr": 0.013696658778002519 + }, + "cb": { + "acc": 0.42857142857142855, + "acc_stderr": 0.06672848092813058, + "f1": 0.22212270488132557 + }, + "copa": { + "acc": 0.74, + "acc_stderr": 0.044084400227680794 + }, + "hellaswag": { + "acc": 0.48446524596693885, + "acc_stderr": 0.004987372476207027, + "acc_norm": 0.6316470822545309, + "acc_norm_stderr": 0.004813719952829966 + }, + "rte": { + "acc": 0.5126353790613718, + "acc_stderr": 0.030086851767188564 + }, + "winogrande": { + "acc": 0.5951065509076559, + "acc_stderr": 0.01379592700312494 + }, + "storycloze_2016": { + "acc": 0.711918760021379, + "acc_stderr": 0.010472537019822575 + }, + "boolq": { + "acc": 0.5571865443425077, + "acc_stderr": 0.008687668766930827 + }, + "arc_easy": { + "acc": 0.6031144781144782, + "acc_stderr": 0.010039236800583206, + "acc_norm": 0.5353535353535354, + "acc_norm_stderr": 0.01023410454341143 + }, + "arc_challenge": { + "acc": 0.2841296928327645, + "acc_stderr": 0.013179442447653886, + "acc_norm": 0.3003412969283277, + "acc_norm_stderr": 0.013395909309957007 + }, + "sciq": { + "acc": 0.858, + "acc_stderr": 0.011043457699378237, + "acc_norm": 0.766, + "acc_norm_stderr": 0.01339490288966001 + }, + "piqa": { + "acc": 0.7627856365614799, + "acc_stderr": 0.009924694933586373, + "acc_norm": 0.7682263329706203, + "acc_norm_stderr": 0.009845143772794052 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b21bc4seed4/evaluation/rankeval/4b284b21bc4seed4_0_lm-eval_global_step80108_2023-02-15-11-04-01_0shots_backup.json b/4b284b21bc4seed4/evaluation/rankeval/4b284b21bc4seed4_0_lm-eval_global_step80108_2023-02-15-11-04-01_0shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..b9289ba3c5da01629517bfcd7e976af53abfcbfd --- /dev/null +++ b/4b284b21bc4seed4/evaluation/rankeval/4b284b21bc4seed4_0_lm-eval_global_step80108_2023-02-15-11-04-01_0shots_backup.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.324, + "acc_stderr": 0.014806864733738859 + }, + "anli_r2": { + "acc": 0.338, + "acc_stderr": 0.014965960710224482 + }, + "anli_r3": { + "acc": 0.3416666666666667, + "acc_stderr": 0.013696658778002519 + }, + "cb": { + "acc": 0.42857142857142855, + "acc_stderr": 0.06672848092813058, + "f1": 0.22212270488132557 + }, + "copa": { + "acc": 0.74, + "acc_stderr": 0.044084400227680794 + }, + "hellaswag": { + "acc": 0.48446524596693885, + "acc_stderr": 0.004987372476207027, + "acc_norm": 0.6316470822545309, + "acc_norm_stderr": 0.004813719952829966 + }, + "rte": { + "acc": 0.5126353790613718, + "acc_stderr": 0.030086851767188564 + }, + "winogrande": { + "acc": 0.5951065509076559, + "acc_stderr": 0.01379592700312494 + }, + "storycloze_2016": { + "acc": 0.711918760021379, + "acc_stderr": 0.010472537019822575 + }, + "boolq": { + "acc": 0.5571865443425077, + "acc_stderr": 0.008687668766930827 + }, + "arc_easy": { + "acc": 0.6031144781144782, + "acc_stderr": 0.010039236800583206, + "acc_norm": 0.5353535353535354, + "acc_norm_stderr": 0.01023410454341143 + }, + "arc_challenge": { + "acc": 0.2841296928327645, + "acc_stderr": 0.013179442447653886, + "acc_norm": 0.3003412969283277, + "acc_norm_stderr": 0.013395909309957007 + }, + "sciq": { + "acc": 0.858, + "acc_stderr": 0.011043457699378237, + "acc_norm": 0.766, + "acc_norm_stderr": 0.01339490288966001 + }, + "piqa": { + "acc": 0.7627856365614799, + "acc_stderr": 0.009924694933586373, + "acc_norm": 0.7682263329706203, + "acc_norm_stderr": 0.009845143772794052 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b21bc4seed4/evaluation/rankeval/4b284b21bc4seed4_1.json b/4b284b21bc4seed4/evaluation/rankeval/4b284b21bc4seed4_1.json new file mode 100644 index 0000000000000000000000000000000000000000..1c3c3f205400d689e82a5b15c850ba6870fdde42 --- /dev/null +++ b/4b284b21bc4seed4/evaluation/rankeval/4b284b21bc4seed4_1.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.315, + "acc_stderr": 0.014696631960792498 + }, + "anli_r2": { + "acc": 0.339, + "acc_stderr": 0.01497675877162034 + }, + "anli_r3": { + "acc": 0.3541666666666667, + "acc_stderr": 0.01381193349957096 + }, + "cb": { + "acc": 0.4642857142857143, + "acc_stderr": 0.06724777654937658, + "f1": 0.3333333333333333 + }, + "copa": { + "acc": 0.75, + "acc_stderr": 0.04351941398892446 + }, + "hellaswag": { + "acc": 0.47759410476000796, + "acc_stderr": 0.004984768912326931, + "acc_norm": 0.6308504282015535, + "acc_norm_stderr": 0.004815882719278391 + }, + "rte": { + "acc": 0.5523465703971119, + "acc_stderr": 0.029931070362939533 + }, + "winogrande": { + "acc": 0.5785319652722968, + "acc_stderr": 0.013878072377497597 + }, + "storycloze_2016": { + "acc": 0.711918760021379, + "acc_stderr": 0.01047253701982257 + }, + "boolq": { + "acc": 0.5718654434250765, + "acc_stderr": 0.008654253415781077 + }, + "arc_easy": { + "acc": 0.6186868686868687, + "acc_stderr": 0.009966542497171018, + "acc_norm": 0.571969696969697, + "acc_norm_stderr": 0.010152943316426265 + }, + "arc_challenge": { + "acc": 0.31143344709897613, + "acc_stderr": 0.013532472099850942, + "acc_norm": 0.31313993174061433, + "acc_norm_stderr": 0.013552671543623503 + }, + "sciq": { + "acc": 0.878, + "acc_stderr": 0.010354864712936706, + "acc_norm": 0.852, + "acc_norm_stderr": 0.01123486636423524 + }, + "piqa": { + "acc": 0.7568008705114254, + "acc_stderr": 0.010009611953858914, + "acc_norm": 0.7589771490750816, + "acc_norm_stderr": 0.009979042717267315 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b21bc4seed4/evaluation/rankeval/4b284b21bc4seed4_1_lm-eval_global_step80108_2023-02-15-11-04-03_1shots_backup.json b/4b284b21bc4seed4/evaluation/rankeval/4b284b21bc4seed4_1_lm-eval_global_step80108_2023-02-15-11-04-03_1shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..1c3c3f205400d689e82a5b15c850ba6870fdde42 --- /dev/null +++ b/4b284b21bc4seed4/evaluation/rankeval/4b284b21bc4seed4_1_lm-eval_global_step80108_2023-02-15-11-04-03_1shots_backup.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.315, + "acc_stderr": 0.014696631960792498 + }, + "anli_r2": { + "acc": 0.339, + "acc_stderr": 0.01497675877162034 + }, + "anli_r3": { + "acc": 0.3541666666666667, + "acc_stderr": 0.01381193349957096 + }, + "cb": { + "acc": 0.4642857142857143, + "acc_stderr": 0.06724777654937658, + "f1": 0.3333333333333333 + }, + "copa": { + "acc": 0.75, + "acc_stderr": 0.04351941398892446 + }, + "hellaswag": { + "acc": 0.47759410476000796, + "acc_stderr": 0.004984768912326931, + "acc_norm": 0.6308504282015535, + "acc_norm_stderr": 0.004815882719278391 + }, + "rte": { + "acc": 0.5523465703971119, + "acc_stderr": 0.029931070362939533 + }, + "winogrande": { + "acc": 0.5785319652722968, + "acc_stderr": 0.013878072377497597 + }, + "storycloze_2016": { + "acc": 0.711918760021379, + "acc_stderr": 0.01047253701982257 + }, + "boolq": { + "acc": 0.5718654434250765, + "acc_stderr": 0.008654253415781077 + }, + "arc_easy": { + "acc": 0.6186868686868687, + "acc_stderr": 0.009966542497171018, + "acc_norm": 0.571969696969697, + "acc_norm_stderr": 0.010152943316426265 + }, + "arc_challenge": { + "acc": 0.31143344709897613, + "acc_stderr": 0.013532472099850942, + "acc_norm": 0.31313993174061433, + "acc_norm_stderr": 0.013552671543623503 + }, + "sciq": { + "acc": 0.878, + "acc_stderr": 0.010354864712936706, + "acc_norm": 0.852, + "acc_norm_stderr": 0.01123486636423524 + }, + "piqa": { + "acc": 0.7568008705114254, + "acc_stderr": 0.010009611953858914, + "acc_norm": 0.7589771490750816, + "acc_norm_stderr": 0.009979042717267315 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b21bc4seed4/evaluation/rankeval/4b284b21bc4seed4_2.json b/4b284b21bc4seed4/evaluation/rankeval/4b284b21bc4seed4_2.json new file mode 100644 index 0000000000000000000000000000000000000000..0abd296a9166c031990a450ebbc74ee6ef783a91 --- /dev/null +++ b/4b284b21bc4seed4/evaluation/rankeval/4b284b21bc4seed4_2.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.315, + "acc_stderr": 0.0146966319607925 + }, + "anli_r2": { + "acc": 0.326, + "acc_stderr": 0.01483050720454104 + }, + "anli_r3": { + "acc": 0.3466666666666667, + "acc_stderr": 0.013744022550571944 + }, + "cb": { + "acc": 0.39285714285714285, + "acc_stderr": 0.0658538889806635, + "f1": 0.2606516290726817 + }, + "copa": { + "acc": 0.74, + "acc_stderr": 0.044084400227680794 + }, + "hellaswag": { + "acc": 0.4737104162517427, + "acc_stderr": 0.004982879340691406, + "acc_norm": 0.6329416450906195, + "acc_norm_stderr": 0.004810175357870948 + }, + "rte": { + "acc": 0.5415162454873647, + "acc_stderr": 0.029992535385373317 + }, + "winogrande": { + "acc": 0.5966850828729282, + "acc_stderr": 0.013787257285896241 + }, + "storycloze_2016": { + "acc": 0.7258150721539284, + "acc_stderr": 0.010316062787590001 + }, + "boolq": { + "acc": 0.5715596330275229, + "acc_stderr": 0.008655028561519765 + }, + "arc_easy": { + "acc": 0.6216329966329966, + "acc_stderr": 0.009951575683331949, + "acc_norm": 0.5921717171717171, + "acc_norm_stderr": 0.010083950240041223 + }, + "arc_challenge": { + "acc": 0.2960750853242321, + "acc_stderr": 0.013340916085246254, + "acc_norm": 0.310580204778157, + "acc_norm_stderr": 0.013522292098053059 + }, + "sciq": { + "acc": 0.894, + "acc_stderr": 0.009739551265785133, + "acc_norm": 0.871, + "acc_norm_stderr": 0.010605256784796577 + }, + "piqa": { + "acc": 0.7568008705114254, + "acc_stderr": 0.010009611953858917, + "acc_norm": 0.764961915125136, + "acc_norm_stderr": 0.009893146688805306 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b21bc4seed4/evaluation/rankeval/4b284b21bc4seed4_2_lm-eval_global_step80108_2023-02-15-11-04-02_2shots_backup.json b/4b284b21bc4seed4/evaluation/rankeval/4b284b21bc4seed4_2_lm-eval_global_step80108_2023-02-15-11-04-02_2shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..0abd296a9166c031990a450ebbc74ee6ef783a91 --- /dev/null +++ b/4b284b21bc4seed4/evaluation/rankeval/4b284b21bc4seed4_2_lm-eval_global_step80108_2023-02-15-11-04-02_2shots_backup.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.315, + "acc_stderr": 0.0146966319607925 + }, + "anli_r2": { + "acc": 0.326, + "acc_stderr": 0.01483050720454104 + }, + "anli_r3": { + "acc": 0.3466666666666667, + "acc_stderr": 0.013744022550571944 + }, + "cb": { + "acc": 0.39285714285714285, + "acc_stderr": 0.0658538889806635, + "f1": 0.2606516290726817 + }, + "copa": { + "acc": 0.74, + "acc_stderr": 0.044084400227680794 + }, + "hellaswag": { + "acc": 0.4737104162517427, + "acc_stderr": 0.004982879340691406, + "acc_norm": 0.6329416450906195, + "acc_norm_stderr": 0.004810175357870948 + }, + "rte": { + "acc": 0.5415162454873647, + "acc_stderr": 0.029992535385373317 + }, + "winogrande": { + "acc": 0.5966850828729282, + "acc_stderr": 0.013787257285896241 + }, + "storycloze_2016": { + "acc": 0.7258150721539284, + "acc_stderr": 0.010316062787590001 + }, + "boolq": { + "acc": 0.5715596330275229, + "acc_stderr": 0.008655028561519765 + }, + "arc_easy": { + "acc": 0.6216329966329966, + "acc_stderr": 0.009951575683331949, + "acc_norm": 0.5921717171717171, + "acc_norm_stderr": 0.010083950240041223 + }, + "arc_challenge": { + "acc": 0.2960750853242321, + "acc_stderr": 0.013340916085246254, + "acc_norm": 0.310580204778157, + "acc_norm_stderr": 0.013522292098053059 + }, + "sciq": { + "acc": 0.894, + "acc_stderr": 0.009739551265785133, + "acc_norm": 0.871, + "acc_norm_stderr": 0.010605256784796577 + }, + "piqa": { + "acc": 0.7568008705114254, + "acc_stderr": 0.010009611953858917, + "acc_norm": 0.764961915125136, + "acc_norm_stderr": 0.009893146688805306 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b21bc4seed4/evaluation/rankeval/4b284b21bc4seed4_3.json b/4b284b21bc4seed4/evaluation/rankeval/4b284b21bc4seed4_3.json new file mode 100644 index 0000000000000000000000000000000000000000..374a97008dca04c73fff269d6dee93ad6e7e20a0 --- /dev/null +++ b/4b284b21bc4seed4/evaluation/rankeval/4b284b21bc4seed4_3.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.319, + "acc_stderr": 0.014746404865473472 + }, + "anli_r2": { + "acc": 0.345, + "acc_stderr": 0.015039986742055238 + }, + "anli_r3": { + "acc": 0.355, + "acc_stderr": 0.013819249004047303 + }, + "cb": { + "acc": 0.4642857142857143, + "acc_stderr": 0.06724777654937658, + "f1": 0.3181222134801993 + }, + "copa": { + "acc": 0.77, + "acc_stderr": 0.04229525846816506 + }, + "hellaswag": { + "acc": 0.47779326827325236, + "acc_stderr": 0.004984857671187105, + "acc_norm": 0.6338378809002191, + "acc_norm_stderr": 0.004807699539973427 + }, + "rte": { + "acc": 0.5595667870036101, + "acc_stderr": 0.029882123363118723 + }, + "winogrande": { + "acc": 0.5651144435674822, + "acc_stderr": 0.013932814110418024 + }, + "storycloze_2016": { + "acc": 0.7231427044361304, + "acc_stderr": 0.010347112890276929 + }, + "boolq": { + "acc": 0.5865443425076453, + "acc_stderr": 0.008613059239942641 + }, + "arc_easy": { + "acc": 0.6308922558922558, + "acc_stderr": 0.00990198741024273, + "acc_norm": 0.6026936026936027, + "acc_norm_stderr": 0.010041053078884286 + }, + "arc_challenge": { + "acc": 0.2883959044368601, + "acc_stderr": 0.013238394422428182, + "acc_norm": 0.318259385665529, + "acc_norm_stderr": 0.013611993916971453 + }, + "sciq": { + "acc": 0.903, + "acc_stderr": 0.009363689373248114, + "acc_norm": 0.893, + "acc_norm_stderr": 0.009779910359847165 + }, + "piqa": { + "acc": 0.7584330794341676, + "acc_stderr": 0.009986718001804463, + "acc_norm": 0.764961915125136, + "acc_norm_stderr": 0.009893146688805308 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b21bc4seed4/evaluation/rankeval/4b284b21bc4seed4_3_lm-eval_global_step80108_2023-02-15-11-04-03_3shots_backup.json b/4b284b21bc4seed4/evaluation/rankeval/4b284b21bc4seed4_3_lm-eval_global_step80108_2023-02-15-11-04-03_3shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..374a97008dca04c73fff269d6dee93ad6e7e20a0 --- /dev/null +++ b/4b284b21bc4seed4/evaluation/rankeval/4b284b21bc4seed4_3_lm-eval_global_step80108_2023-02-15-11-04-03_3shots_backup.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.319, + "acc_stderr": 0.014746404865473472 + }, + "anli_r2": { + "acc": 0.345, + "acc_stderr": 0.015039986742055238 + }, + "anli_r3": { + "acc": 0.355, + "acc_stderr": 0.013819249004047303 + }, + "cb": { + "acc": 0.4642857142857143, + "acc_stderr": 0.06724777654937658, + "f1": 0.3181222134801993 + }, + "copa": { + "acc": 0.77, + "acc_stderr": 0.04229525846816506 + }, + "hellaswag": { + "acc": 0.47779326827325236, + "acc_stderr": 0.004984857671187105, + "acc_norm": 0.6338378809002191, + "acc_norm_stderr": 0.004807699539973427 + }, + "rte": { + "acc": 0.5595667870036101, + "acc_stderr": 0.029882123363118723 + }, + "winogrande": { + "acc": 0.5651144435674822, + "acc_stderr": 0.013932814110418024 + }, + "storycloze_2016": { + "acc": 0.7231427044361304, + "acc_stderr": 0.010347112890276929 + }, + "boolq": { + "acc": 0.5865443425076453, + "acc_stderr": 0.008613059239942641 + }, + "arc_easy": { + "acc": 0.6308922558922558, + "acc_stderr": 0.00990198741024273, + "acc_norm": 0.6026936026936027, + "acc_norm_stderr": 0.010041053078884286 + }, + "arc_challenge": { + "acc": 0.2883959044368601, + "acc_stderr": 0.013238394422428182, + "acc_norm": 0.318259385665529, + "acc_norm_stderr": 0.013611993916971453 + }, + "sciq": { + "acc": 0.903, + "acc_stderr": 0.009363689373248114, + "acc_norm": 0.893, + "acc_norm_stderr": 0.009779910359847165 + }, + "piqa": { + "acc": 0.7584330794341676, + "acc_stderr": 0.009986718001804463, + "acc_norm": 0.764961915125136, + "acc_norm_stderr": 0.009893146688805308 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b21bc4seed4/evaluation/rankeval/4b284b21bc4seed4_4.json b/4b284b21bc4seed4/evaluation/rankeval/4b284b21bc4seed4_4.json new file mode 100644 index 0000000000000000000000000000000000000000..d552572c4d050c4470d865e408b396f760319ef4 --- /dev/null +++ b/4b284b21bc4seed4/evaluation/rankeval/4b284b21bc4seed4_4.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.332, + "acc_stderr": 0.014899597242811492 + }, + "anli_r2": { + "acc": 0.368, + "acc_stderr": 0.0152580735615218 + }, + "anli_r3": { + "acc": 0.3491666666666667, + "acc_stderr": 0.013767075395077247 + }, + "cb": { + "acc": 0.48214285714285715, + "acc_stderr": 0.0673769750864465, + "f1": 0.33712121212121215 + }, + "copa": { + "acc": 0.75, + "acc_stderr": 0.04351941398892446 + }, + "hellaswag": { + "acc": 0.4765982871937861, + "acc_stderr": 0.004984313205791442, + "acc_norm": 0.6384186417048396, + "acc_norm_stderr": 0.0047947648436852865 + }, + "rte": { + "acc": 0.47653429602888087, + "acc_stderr": 0.03006330041190266 + }, + "winogrande": { + "acc": 0.580110497237569, + "acc_stderr": 0.013870943986310395 + }, + "storycloze_2016": { + "acc": 0.7300908605024051, + "acc_stderr": 0.01026541350322146 + }, + "boolq": { + "acc": 0.5691131498470948, + "acc_stderr": 0.008661108320775374 + }, + "arc_easy": { + "acc": 0.6304713804713805, + "acc_stderr": 0.009904325878447319, + "acc_norm": 0.6085858585858586, + "acc_norm_stderr": 0.010014917532627819 + }, + "arc_challenge": { + "acc": 0.2960750853242321, + "acc_stderr": 0.013340916085246263, + "acc_norm": 0.3250853242320819, + "acc_norm_stderr": 0.013688147309729124 + }, + "sciq": { + "acc": 0.908, + "acc_stderr": 0.009144376393151108, + "acc_norm": 0.9, + "acc_norm_stderr": 0.009491579957525044 + }, + "piqa": { + "acc": 0.7589771490750816, + "acc_stderr": 0.009979042717267315, + "acc_norm": 0.764417845484222, + "acc_norm_stderr": 0.009901067586473885 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b21bc4seed4/evaluation/rankeval/4b284b21bc4seed4_4_lm-eval_global_step80108_2023-02-15-11-04-02_4shots_backup.json b/4b284b21bc4seed4/evaluation/rankeval/4b284b21bc4seed4_4_lm-eval_global_step80108_2023-02-15-11-04-02_4shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..d552572c4d050c4470d865e408b396f760319ef4 --- /dev/null +++ b/4b284b21bc4seed4/evaluation/rankeval/4b284b21bc4seed4_4_lm-eval_global_step80108_2023-02-15-11-04-02_4shots_backup.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.332, + "acc_stderr": 0.014899597242811492 + }, + "anli_r2": { + "acc": 0.368, + "acc_stderr": 0.0152580735615218 + }, + "anli_r3": { + "acc": 0.3491666666666667, + "acc_stderr": 0.013767075395077247 + }, + "cb": { + "acc": 0.48214285714285715, + "acc_stderr": 0.0673769750864465, + "f1": 0.33712121212121215 + }, + "copa": { + "acc": 0.75, + "acc_stderr": 0.04351941398892446 + }, + "hellaswag": { + "acc": 0.4765982871937861, + "acc_stderr": 0.004984313205791442, + "acc_norm": 0.6384186417048396, + "acc_norm_stderr": 0.0047947648436852865 + }, + "rte": { + "acc": 0.47653429602888087, + "acc_stderr": 0.03006330041190266 + }, + "winogrande": { + "acc": 0.580110497237569, + "acc_stderr": 0.013870943986310395 + }, + "storycloze_2016": { + "acc": 0.7300908605024051, + "acc_stderr": 0.01026541350322146 + }, + "boolq": { + "acc": 0.5691131498470948, + "acc_stderr": 0.008661108320775374 + }, + "arc_easy": { + "acc": 0.6304713804713805, + "acc_stderr": 0.009904325878447319, + "acc_norm": 0.6085858585858586, + "acc_norm_stderr": 0.010014917532627819 + }, + "arc_challenge": { + "acc": 0.2960750853242321, + "acc_stderr": 0.013340916085246263, + "acc_norm": 0.3250853242320819, + "acc_norm_stderr": 0.013688147309729124 + }, + "sciq": { + "acc": 0.908, + "acc_stderr": 0.009144376393151108, + "acc_norm": 0.9, + "acc_norm_stderr": 0.009491579957525044 + }, + "piqa": { + "acc": 0.7589771490750816, + "acc_stderr": 0.009979042717267315, + "acc_norm": 0.764417845484222, + "acc_norm_stderr": 0.009901067586473885 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b21bc4seed4/evaluation/rankeval/4b284b21bc4seed4_5.json b/4b284b21bc4seed4/evaluation/rankeval/4b284b21bc4seed4_5.json new file mode 100644 index 0000000000000000000000000000000000000000..61f2e179efa9aee0aba89444f6db0358b079e55c --- /dev/null +++ b/4b284b21bc4seed4/evaluation/rankeval/4b284b21bc4seed4_5.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.343, + "acc_stderr": 0.015019206922356951 + }, + "anli_r2": { + "acc": 0.332, + "acc_stderr": 0.014899597242811478 + }, + "anli_r3": { + "acc": 0.33166666666666667, + "acc_stderr": 0.01359683672948518 + }, + "cb": { + "acc": 0.39285714285714285, + "acc_stderr": 0.0658538889806635, + "f1": 0.22512077294685992 + }, + "copa": { + "acc": 0.79, + "acc_stderr": 0.040936018074033256 + }, + "hellaswag": { + "acc": 0.477096195976897, + "acc_stderr": 0.00498454354093234, + "acc_norm": 0.6394144592710616, + "acc_norm_stderr": 0.004791890625834213 + }, + "rte": { + "acc": 0.5306859205776173, + "acc_stderr": 0.030039730592197812 + }, + "winogrande": { + "acc": 0.590370955011839, + "acc_stderr": 0.013821049109655472 + }, + "storycloze_2016": { + "acc": 0.7247461250668092, + "acc_stderr": 0.010328538400500572 + }, + "boolq": { + "acc": 0.5896024464831804, + "acc_stderr": 0.008603488048617521 + }, + "arc_easy": { + "acc": 0.6308922558922558, + "acc_stderr": 0.009901987410242733, + "acc_norm": 0.6077441077441077, + "acc_norm_stderr": 0.010018744689650043 + }, + "arc_challenge": { + "acc": 0.3046075085324232, + "acc_stderr": 0.013449522109932487, + "acc_norm": 0.33361774744027306, + "acc_norm_stderr": 0.01377868705417654 + }, + "sciq": { + "acc": 0.916, + "acc_stderr": 0.008776162089491132, + "acc_norm": 0.909, + "acc_norm_stderr": 0.009099549538400243 + }, + "piqa": { + "acc": 0.7584330794341676, + "acc_stderr": 0.009986718001804456, + "acc_norm": 0.766050054406964, + "acc_norm_stderr": 0.009877236895137434 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b21bc4seed4/evaluation/rankeval/4b284b21bc4seed4_5_lm-eval_global_step80108_2023-02-15-11-04-03_5shots_backup.json b/4b284b21bc4seed4/evaluation/rankeval/4b284b21bc4seed4_5_lm-eval_global_step80108_2023-02-15-11-04-03_5shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..61f2e179efa9aee0aba89444f6db0358b079e55c --- /dev/null +++ b/4b284b21bc4seed4/evaluation/rankeval/4b284b21bc4seed4_5_lm-eval_global_step80108_2023-02-15-11-04-03_5shots_backup.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.343, + "acc_stderr": 0.015019206922356951 + }, + "anli_r2": { + "acc": 0.332, + "acc_stderr": 0.014899597242811478 + }, + "anli_r3": { + "acc": 0.33166666666666667, + "acc_stderr": 0.01359683672948518 + }, + "cb": { + "acc": 0.39285714285714285, + "acc_stderr": 0.0658538889806635, + "f1": 0.22512077294685992 + }, + "copa": { + "acc": 0.79, + "acc_stderr": 0.040936018074033256 + }, + "hellaswag": { + "acc": 0.477096195976897, + "acc_stderr": 0.00498454354093234, + "acc_norm": 0.6394144592710616, + "acc_norm_stderr": 0.004791890625834213 + }, + "rte": { + "acc": 0.5306859205776173, + "acc_stderr": 0.030039730592197812 + }, + "winogrande": { + "acc": 0.590370955011839, + "acc_stderr": 0.013821049109655472 + }, + "storycloze_2016": { + "acc": 0.7247461250668092, + "acc_stderr": 0.010328538400500572 + }, + "boolq": { + "acc": 0.5896024464831804, + "acc_stderr": 0.008603488048617521 + }, + "arc_easy": { + "acc": 0.6308922558922558, + "acc_stderr": 0.009901987410242733, + "acc_norm": 0.6077441077441077, + "acc_norm_stderr": 0.010018744689650043 + }, + "arc_challenge": { + "acc": 0.3046075085324232, + "acc_stderr": 0.013449522109932487, + "acc_norm": 0.33361774744027306, + "acc_norm_stderr": 0.01377868705417654 + }, + "sciq": { + "acc": 0.916, + "acc_stderr": 0.008776162089491132, + "acc_norm": 0.909, + "acc_norm_stderr": 0.009099549538400243 + }, + "piqa": { + "acc": 0.7584330794341676, + "acc_stderr": 0.009986718001804456, + "acc_norm": 0.766050054406964, + "acc_norm_stderr": 0.009877236895137434 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..48a5d0754c2e5f0b1a03c77a9e721cd7dedce027 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5985ff37d824a6c50baa77b2629dbd43c466cf4352c9de30e11cd974037bcc63 +size 199058647 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ecba623669e7ad34ff4ef2b6cb3043339b59adb0 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8061a6771e3c5284c6e524d6a271cd5cefa349ee919542a1d8388877dc7daf88 +size 199058647 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bb2b5e56d833067dcf1bbf64d62774ace6db5cbf --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8af222758ec94d5aad1c47e94afcc1e15e40a1bf13350438a54a70cc94a9ce58 +size 199058733 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f984d27a0035848a2040edbbb5bf2f262e7ae252 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f59846ae7417eea6c648155e4da11efdae9c3e0f3df3a3f50754b6da0f60b99c +size 199058733 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8a3cca2d69f55e57f649186e32ea12a73b7db947 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:69bd2fdcf6d6aed276d5d5342fade728a1b9ed4b871faef7691adb805fea9831 +size 199058797 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cdc3bfe3965a73216f0a8e22228f4b2a5cf05178 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:91adcf4ee9879d43b18beaa436aa782b3c871589872127372e1e96e19ddc9469 +size 199058797 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6ac440e0ccf0cdf5e8f62bafbb4539915c27ca49 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:296c6e8396e47312d4bd928a92a8d20ed8cb7581d8569a14377d5e99d0445321 +size 199058733 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4e8a883a3a377e07fede4e11a01f36b64cdc9b4d --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:29ab38b797dc9c35d8f27038975f2674eb2b5df3834cdd747f654e42bce1018c +size 199058733 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b36e46288f0e95e4552c3d92f055da60835a9da2 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06aa86d79fd9f9e97055094f4bae583484666d19aba56adba3c078fe4c80b3b3 +size 199058733 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bca7e43b1aa47e24cce1b61b32b27c9a76bb2ab3 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ad3c5df61233095d988bd56b3c398bb084c0743736edcf16302da7b2c5cee14 +size 199058733 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..62421f28983688fe3c165dc30da808087f51c4be --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1aa8be3e0f34bee2506b4fb35b505b7319ba81ca15872cc4f72ae7e900d7faa8 +size 199058797 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f2d60ef365563f79d35715fa16e0972afb5f682f --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6094d49f78bf16a5c78de9d620d1a4e26d3ffeece5c384ed44ef79263c707dfd +size 199058797 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..65d3fc3b87db05de0495f0cca0dc142695f04f71 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c5755c15db6b3bc532736ede71f3a53e382dc1ecc8078abaecc49bdefd162a30 +size 199058733 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..da4503e3ac6065afdee077c9ef36fd9b9cf09dbb --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:05dd46feb03078198356d96e92b1cc187e2655f183c5f66cbf96f015099a189f +size 199058733 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..22168abbf285a066aedf2456eaebac74f079b196 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b5c61d179c54f295203ca389984debbfd0c2ff82f3a37f99c3d781da7c898ac4 +size 199058669 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..106849f7f05b3b266d7d2ef0bb849fc72005e7a0 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:59587605566f8b3f8f7c19489322e378e297a85dfd9b1db6a0e4439445a80fe4 +size 199058669 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..08b8ec49311c26119500f5eac19f968f537a8de4 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:894824553e11f5e7d56ac18f2cbf72c7647cd403f0886b9181f31f1f376b6822 +size 199058797 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f84a3f2191f5fdc01f2ee6d46f9fd3e18a7d6219 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f8d7584504749dfaa374af5e7918bfcfa53cfbdc36a2b566eae8572e7f78b589 +size 199058797 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4929d9fc777d5159f75caa8ffa41697229a0a625 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:004616c25ed80e0c479452e87b2255fb17a39b7ada0a3d3613caf55faba0816b +size 199058733 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..28bb1a5e68f37c86ab9262e8db68cf554026618a --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca5de6fbfa84bbe16af12a94f25988002754aa92eb7b838c1ef8612759ac3d3f +size 199058733 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d74abb63bd17045c9d0e9f33a81725df4c4ae653 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f6270eade470ba80a2a7319b284a8480679f9e0b2e4c0dc17de727040872c132 +size 199058733 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4c0205bf813206a16203284ade926e3dc567cdb2 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:526960e43fd93d276f0568e8ea15b20b9aaefb59a552a24c8d03759c6a9d817f +size 199058733 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f9eb812b7c14c500742c50895c58cb46e90b34d7 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5351fe1272c8566a83da08e62dc83dec3fabd6a570bf919ec92c3797465a8f13 +size 199058658 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..22dbcc90a0699e707c7ce7adb1ab3987895ee905 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7562ab235d0aaf55e6a65faa1880bca6d9c4fc4841333c4a08d9ebaa381e9b65 +size 199058658 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e79a9588d2d8214677f052eb6f0b78be9ee33abd --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:467a316bca3bd6251b9d38597edaf8a49d902268a6828a4209caab95fc3a409d +size 199058733 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..26d12bb9d49abaa43318c745ab416065c7d765ad --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:65994e452cbd5bf60567f2240d6fc1645f679e9dc9a502966b240fc233f92717 +size 199058733 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0fec38a69ac00bb15729791bab112348d0ddbe8c --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3be7d0cf6a60aaf0e90328ae5bc56271d52865268c3be6b274b51805adc6386 +size 199058797 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8442d35c3b1fe87fc4e404e8fe9707a12cd9c839 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df70ec9a3a64e311e5f413409047b137862284cb8debb7b7ab2b805976dee3cc +size 199058797 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5d4994f957a8c75815abdbd8514b57370899ddc2 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:32083539ce10677ed916fd21be85f35bde761b6495db8ee052e30de416dfc277 +size 199058605 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..64cd57eecd3d5d9ae73bdddce268c71d8b44721f --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed8602e68f08423fc418b6b100096a569dad72f7c449774c6ba717fa9035f611 +size 199058605 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c4300f9d11e50cfa0cc45e45f2070d95cc62189f --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f624f1f4e65fbd4bb6b3c4d5f1623d75337cc2174b4c81de8ccfbbe4589b2615 +size 199058669 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..360d505764d890e9a5dea579e4abf47d0f794f13 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:549c1c0a486a19249d0f702e9902034283725afdeb0d670c03a1c191b72ddae6 +size 199058669 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b329506d02c05cb7156bfcbd861ed64087ffa62f --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db48cf59240a01b904eba18ceeb3ed658b930729c5e5f18e1a39ed12ee87b193 +size 199058797 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fd249f3316640ffbc7b12b543cbaa4b7379398a4 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d18e29e715be50e268566484ff2df31a73feacc90132968cf451f981a47d37b +size 199058797 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c84a3cfb1215d56aa9390f226211aca9bde2bc2c --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec8f2ab8ae2c96b64715a84808b71b8e24fc04467a0b70757ce2eefee670dfb2 +size 199058733 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0c0f6721b25d6bb9a64815518a8a1a0d2699fa08 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f4d7ed64f51e690f230b477d1cca7c6fa0ae5eec398b7d22389a6c697c69eeb6 +size 199058733 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5d71a3f3057fabd77931a2850a5c77b2efa3d5b6 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:435d1d47273d723a146856a78952f66308ba72ee354edc9af4b96d719488c97c +size 199058733 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..24f5a8122bf2d1ffdb4538ce889cc6a1343f2251 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:083d674c36c5eb89560706d6f0ad895e993e17471e4bcf6ee4e8b7d7606fda74 +size 199058733 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a390e759e84e9c525fc2ade4285f5e84897dddc4 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a7595f09443378a5aebf5f60d8d951ed318c5447ed10c6fe686ea612ff393fc +size 199058733 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4104e9b72b0a3c2d48b0b1830d4eb2bbfb8e2890 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d08bce62c312f3bda6eaec4deb9419c2dface0631377073876464efd6e0d6c6a +size 199058733 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2990280d80328a9c394f3fefba7ef71f24dedc5e --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce00e99cf5018db47d9917d78409b9c6c9c07b6042f30d6b4af4942a051ce7da +size 199058797 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ab1c03800b83492fbd947994dab6e006fe7e76d0 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d677d633ec7b5c2897320ad9d890ccd7934a737fb912ff07db23fadc9a8d527b +size 199058797 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9399dc3d86d057a00f203922bf496006e0ae2ae2 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd69ee989a7324f84cb3fe562c17b7ed4ea8dc07850793ebe892f7d64bdc0e2e +size 199058669 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..583cb88ff0df393f9622a48b09b3fdd8ab895969 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d30c600361988303eb794ed69a90c3c8f74d6525abc1694cb74d2bc2529623c8 +size 199058669 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..22fc67773b65e3e21d90a6d3acdd1547ee062ec5 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f722755b5f397457a0abbcc058073fe2c9be6c2f95abee4ba2acbdba6dbd8a8c +size 199058850 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9da786ed5f9c347aa874c572e8db864132c7bbbd --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c5aeb377a82414b5ccfd9ffa8911cbd4465007fded4e4688024731650167a853 +size 199058850 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..57b87bf0b53af07fd1e37ca3e79a69b47a30e5c9 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df46ea7ae76a1af0e5f339fb4f8391c739786eb2ff25bea9ee4da89cd5df4da1 +size 199058669 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..55dc6f5a262748678c55545ae9087609a81fb7d4 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39925709d75413f8b7abba7128e242ae3077bed2ac24e1ad3ab85660fcddf033 +size 199058669 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f60dce2286bbb09319521877ba92e31d421d3fd6 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef3c7545aa7e34c195d2824cae34e4d7794bfe66a76b527badf8ec5fb669259b +size 199058797 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..954cee810ff3351a11de43bb311af4454d081cf8 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:18d8041e403908ae89d3981d578635930700903fb8eba75af1237fd8f41f247e +size 199058797 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dee39228e6a4bf89686160cc7fc92eecb878620a --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d054fef314466e5c73b18790d3b7c0bc72d4a5fb0b4dc362afcfa89faf3d284 +size 199058733 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1796cfa23e407fe3ade5a01109f08e40fe186630 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bbe141ef93f28c12898b026a14b653bad08612f999e41e6dd6155f1f3535e7bc +size 199058733 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ce1cb8963dd0ed22f95505629f5a94c119ae4f68 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a36684ea83924b74e84e989a35adddcf61d236bdbd91d24764539a4f585c9c6e +size 199058733 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a481deb45560ebbee4d3f0cdd5269d9abaeb9433 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc40a9b3ae64af45a1f759e4edfae0aae8f0944496a5ac269628e552ff5c45da +size 199058733 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..75f7de728edf4356e2bedfad716dd56653d22a2b --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d73bb25c4cdae4b66ad23a31f538f43025086b8299833e4468dfc1d921ca6e2a +size 199058669 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0c9ec7bacd15324cb5d9ef10b1f7661bd872afbc --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:59dfeca2e58c0106cae828a9fb38bb07e3d3aae79f1746c005515e4484299d02 +size 199058669 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fb4afbaacc9b05f93ea715bd8a43e31fc8e376dd --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c76f8df376f5c9346d963f4d23020d3d68bcace5f97fbacb7c039e68466d97fa +size 199058925 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6ce50b3a21a4684b87b60e8051832bd5992598ee --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b523fc19daf2fb931ad4d70d02455309d58168e049867dd3124e1068fd168fa9 +size 199058925 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9044d4e3fb0dfb8e7043c7ab14e8988ec99727a6 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:32e4242aff107f8e0ad431875fc6404571ebc8b4c4b45e5d8c5a7fcc65f14b63 +size 199058605 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..80ce10c01cc5c868285d10342f8b94a360c217c2 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f1625b25215fbe279db8b571151fca5adc591471d61d102b959eb208fc0bd74a +size 199058605 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f06534c2774cdca63d12c0e1efc59c605e4cc45b --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:898baf5c088752a14746d5fc901f40f0b4ea3435789e5fcf170a48d3c5bb29dc +size 199058605 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..82c8dc5a7f8498f42166ce8403bc1ddd93d43b3b --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce6d5ef9319910759d1fab07dd00de7ede607b2b20a438da159df5a0e4b69502 +size 199058605 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0f706bfa0734879481348472df171c232b678075 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b574f89a35eb1c287e4264d88386ecf3bbfc57010686074fe0b2e6dabe5f547b +size 199058722 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4a54ba0fcd1bea09cc3e1b690b3468950e7bf155 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c241a3978ed4431e5beccba87907bb104633da554eee00a93a86a4844c2e1338 +size 199058722 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a399537b6cc828e424ae8ed6f660d1d01a249b42 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:580a069ea8520cbfb68902ba45ccaa256183d4579aecbcb56f582e6074c8a0bd +size 199058658 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0585829df9e4cf70c8e00e7de4dc94ab69f2d086 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd94f10d95574eca391285342d5be3c5d44b599770c77684587536383fc02d11 +size 199058658 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ca8fb5331aebe9eabc0ea7438e5cadc08b84d74d --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c2977bad667c6e6fd45b0eebf48a74a0dd4f675296b35a47500245fdbed26ba +size 199058722 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d5355e0112df4aed1d45613d8c2c22f8bca9c8ef --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7497c1a8a764e174b2a4537a32660a7977937e83b7d448bf3b2a6ec881004657 +size 199058722 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e47ec51cf7ef64348acd7bbc6576d8ce5e0fbbac --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ae4d2d850a75825e48441b0b1d1ceee8c4db3a2329c3ee8b4db4abce55659dd +size 199058658 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..719fbf7a1c60318abef5089ad4ab521f2f5dc2e7 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a075c76604861be863da11572bdafe76a78c03a276a3c290237b6d603cfc96b5 +size 199058658 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4c4c421a91a20a2bc23f3f268773b6700a1c0251 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b4b33161f21f96fac4edfc7b739abf4d8a43b935b6219639040dab27839ff18b +size 199058786 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d2a1199deb9bf98c9cab633c157990f7b690ccae --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d5c442fd4a399813b6c77f286af1b55e4829969faf8a95079061eb317a5cea5d +size 199058786 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7fc0178d0a1a76539805209908d584dd075c3a68 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2d5252d93407e9820b5f2a331aa751ecfded7d1dd085164f55a61eb30c5fbaf +size 199058658 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c23361ea9a517e7aa329945802134cad02844a62 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7810e6898b7909bd634d9cbdb21e16a69d3d0ccf89c0e6a052eea4f13dfa1b2 +size 199058658 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f37bde36a4ceaea0f3c3d88fe98a5965b0bdbc08 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb2f11b6088e88ba5046d5b2825ed80d92a2700fb061484ea6cfa637779b5abb +size 199058978 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..87695ae1c5841e7fb31b38e722085753f07dfc93 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e24e46db6484b92cb5b6f1939bb838b7b79039b537e70c7241461a6dd47d82db +size 199058978 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fac87e8734a5a3978a165e4d9e5a3b8d717aa8cf --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a487b8568b5a2175ae094f4a12826823a15b9d7f850222a23f1677e9f8f14ff +size 199058658 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6ee9c315f5a7775c45c6feb73ff421e30b895c8e --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:49521a204e46ba7af51182247837aa6c74e40bdbb7fd16294843bff563925322 +size 199058658 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..929835d1fc6c731ee5fd9921bc243457880fcbae --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:47183816e181193b646cd888efb4b8e679ac9cd77d3050136d68a51ba852f4da +size 199058647 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a98943ad982609380857377992280821e29696b7 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ebc3b948342147c349d61e53083446be740fc265d306142111bec16499234dab +size 199058647 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..935ff1791bde212b893908001124292c3f9f7e63 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:86c3da7c3b2b2a9f1c0c040f3e2eea798ceb66c3f91d7d5c064a4b3902582831 +size 199058658 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..231375bb02c3f70c6efcfb7012160d71f5406707 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97e4d3cb809b6ac92f6b513fded0ce683df07c24fdb19c68c195aaccd76965a7 +size 199058658 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9882e00618932bc965cff86be17e393276daf5cc --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2f901c6525ff8371da65b544cd203491f1bcb46068a0cd9fcc734cbe1800601 +size 199058722 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..20d0927a0eb02a1d7084b00b5c93601d1744c1e3 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:246982b143f8f030675c333b7fb341946b388e7170910cbeb74b9f085bd4fa55 +size 199058722 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..59ce14133837666d081c47c1e0b95413d30dd2c8 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31775d1418775ae0b121f3e65a35c45f865006dc8387457a312f2f30be27b129 +size 199058658 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..228833e99d1e894c4098968122a038e54bbafc10 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:59164104211db8c541390a816d71649b5d12410c8676a7702da194afbc9a0b11 +size 199058658 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2d25c4189b69d3176e6cedaa221e220f8a180401 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:52e34d3d4f956af8138d7f23728c238281c847ecf356aa67b7a997e39c80b365 +size 199058786 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e53feb937cec40664d6fc32b75fd335451d3f9c1 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ce25425d43a6aab1a80c61e107abee4bf99dd3d5b49c34f2fc1b732c44e50d4 +size 199058786 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7da042e73ebd8c1ad062a0572c6b01c42c4f0b50 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:49f80e86f8af8732315f8f437e4671f396ffbdc95d351e36233a374b2edbc870 +size 199058722 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8ecd98be3e76d7a66946e50791f6a95aba4e9de8 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0174d852a2ea78ab5d073952831faea16d7055c2673279c8cd72759d4ba8c5c0 +size 199058722 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ab2b4afe90224c62f25ca9278b0fa40d95dcbdf0 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b71d2896c1cdd897e91989116980f14e9b0bdc89891571d50c6320b7273adba +size 199058850 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..84493a6ec6579c71145c15ee24acf37b36831925 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e41070645ca9875e3e769845dddd19ef0f97ecf6d20dfff2e7a1cf84612ed080 +size 199058850 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..02ead9540f1e2248f0e8df026e2335bc14249c6a --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff2685c7661fbe8acb2b17540a7d8f03e28ebff80fc177f0a6ebb5dece645535 +size 199058722 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fcaa0adcf9ba1680e6f5b2609c5085e377610144 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3aa390d48838bc70e6c14d7340b95275f547b8405e0a27f70605a8c1a2b2a50b +size 199058722 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..241fa57085f86aaa32f389715927098d4fe9f2b9 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:09d768bb69cbca731da782371df0e0deaa1da6f8c3adc5a4a7e64dacab9f3021 +size 199058722 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cf7f875b6ffe82a453b992178f1c82674f4a5d52 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:95709a2426fb0da8370b9ccd1122724a263536b853952309eda447baae673cec +size 199058722 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..86f3415686f10ee5c89946f07eb42810e9a29eae --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca1a6e8326aacafea959d9b2bdd6e34463b2942322fee503d3a1682d64fb5fc9 +size 199058594 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..91cd09345ded8e52f21d3851be2be7c16701a0f3 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:073f08d09a929c19cb350a54b5af677a561d31a1963ddb6df8f830aae8d9fa5f +size 199058594 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..251e5b749624642e40c67d3ac858f80edf019fb6 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c5d86ecedae06369d96488d912922a92633514846031baf25fef18d2ea74942 +size 199058786 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fa5686da8308afea302bf28aca9de0b18aaca24a --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:379663cbe3fa820e09272110aba2cf311e1b06848477ab239fd574cac58ab8b0 +size 199058786 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..05cd1199a247651e555a3e638a245b58b7fc7cf4 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be46698520250ec88f3df50f35a90645c8b5464c76d0f85bb66efd52f56dd953 +size 199058711 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3bea0da64350c71de7d965a6f8c1cafcc3c44017 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eeca70ff1688c36b875d980696882b8a2e721f60475b161ce469dd9fd659f658 +size 199058711 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fa65bce037867c700d5081afab71508a4c183aa0 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8121fd2623d45dfbb84e8c02d483fdf5db651094ed16b253d3c8194bb5dc7db7 +size 199058722 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f76a5855a75651a01be2e507eb302b0bc364fdde --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e296932dc87756d0d50bd281d384dfdeab33a8d2a77b5d3d5de73fe5a0a0970 +size 199058722 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cc8bcea35b9aebf68e7ad19ee6118cf13d0332d2 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c453ef6d9cd39781733dfb916380e9b14955d636736da2ef2aa111bdcfeaab5 +size 199058722 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7935211d3e05d86f6542bcc69e2ffe64165295fe --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7182cb4d816552b089aee15bbfdf4098ec105e76edcd781191be25e79d991200 +size 199058722 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1f84ed994be62690e98a2d200cfec93e4b2ffec8 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06ed7d3f4bebc5155206b79d5de0699f925a71aef3028b2157928b41b1012393 +size 199058722 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6406fb653e586a1879f78414bb4b39f4322160f4 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb1bc82412a062dcda796ec563218b1e473f83dbd7acbafc7e40ddcfbd37bfaa +size 199058722 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0755bba65d47fbdf532ea256f2d06badc21761bf --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:15ed6cd18b5d6ee035c7c9db44d2a50057c8742648643a5e3818bf7084bd7f6c +size 199058722 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0b6545298f53170d294c9688bef71cc4b91735b2 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:89896962e8eed5662c77dedd63f7859a8fa3751fd346ab8c0ec7f2351d5298b8 +size 199058722 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a5910ce30b2f85cf45538bf4b942cf607021d0c7 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a7d90a9313b1d33e883f76ee27944c3d3311e4960d261cf971c667a6f3a17bb +size 199058722 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..83a0909e8c90c5925e4c24bbb4b0d104f2447261 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b3b4f8ad3f5da80c9a7fa3ec8b7d32691e0314a3837f01464a9cde6e1577bad +size 199058722 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c245c8d5fb33bd47d2d9f0672549407cc042da7a --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f6ad83ca17f3d4e444bd892c3d7fa99da41300c0c3b873e5b185a2c91303737e +size 199058594 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5381a12b3a0e61feda161d798c3b0cb2984ab699 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c924dbe822b368d9c673a55a60f2222b3b0d05243129cf50f99000dbcc6dc6f9 +size 199058594 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e682a58a2cd3004374e9bfb0f5d349af2b39d85f --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:916d090a0fa98c9500c5a3183b9a4dc5fc6ea524c9c6fec4b4fcf51ce2310993 +size 199058722 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f9b7bf2142b4d0f5ce2ebae0eb67998e605ac400 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e5372cffb02487953dc1082c376d589283f20c603549f52ada0ffd2f71042f44 +size 199058722 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8f844e56c424b885bd1dd68fff545df01b366b2a --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f379155230357f526d75211a105b76d1f259180e0590c40b81c74c4a6f554ac +size 199058786 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..687adf7bb6c0131cca536f919a04223b4f8d3fab --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:55e92764eddd05de35641a2a22b92f87411c414265cd16ad86b0826dcbf43c9e +size 199058786 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5e29c1e64609ec1cb3ec468e6dea011f5d3cdb7a --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:04700b9c1b8c3a1a21cfae005c581c9e10202c91cd8573d4331ab4ca9f316aaf +size 199058850 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5e4224b0a16836cb506d92994172a29cf3b642de --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:87f903a8a6d1914b9899818d152e415c24fadb512511accda3878a371820d0d8 +size 199058850 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bc132786534cb62ad10094ab57fd83cee63e033d --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af423140f74cb4d66ab03d00c5be03ec09b6d152e97b4456030085c4b033e1a1 +size 199058658 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..98014cba489d1e807107a6598ef24d33685d7884 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:86b2227012fa9e127517a82a52ca38a0cd9326b0d483a84252a87a1cd4f66329 +size 199058658 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c6e30740edd47421271bde6c7e06d1354a0fb2dc --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cdf2336fdb42ebdb3e984c5a2efec210c39e20e4753592047e6c755e87b0c4e3 +size 199058647 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2e3e313a020afca300f4ed6925344d8f241aea1b --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e409d1e02fdd34afab8e52966536cb09616687214e2d115b4320eae574ded1a4 +size 199058647 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4da122b808b04919278da65734e52231a7dfc398 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22dfdc3377936e5a1f00179d2bb90bc73bacbce3ded85a06a57eba766ccd6d27 +size 199058722 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9d67c54b0de9cab6a00d55097dcfa4b2efb9f0a1 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b71023d746c7da121355355535d2d7f67569e0d473dc68b9ef7790bfef468fa +size 199058722 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..935ee9407b5b336d18c7804875d54c3180350c7f --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:75ce3ee3e1ecae0312288f8b90f769b577245b764997654c5d09ff2e6a096650 +size 199058658 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ccdbd4364a76222b247754dfe5ce85889f1c2292 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d764a322d0bae991bffa13329bbf171a88a36543052484eff354c6203d7b274 +size 199058658 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..73b19cc806496863b1e4e537bb4fb327cc3bfe3d --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3cba827d6cfd6374efc0a035cd1f2d6c3b2586a57ea0574ba4a0a6fe817778df +size 199058658 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fc6c67337b48353c7eb271b2ec557e2691c42e5d --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:585b31bd805f972100a357294bab9ca14eeee2f3779140a1d4ab3127a95d8545 +size 199058658 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a1938f19b24eb66f55041fbfc632901d744f20ca --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:024288c0bab79305a3057861fe8ef10b1bd661aac6be5231f4dcf56698b9ba39 +size 199058722 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1c8919e08954936487d72871616f4b677367d70b --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:15d19df8359bd8adc75633cfb8038b66508ca6ba55827600717993d5955d2145 +size 199058722 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9f38ba4a4b12845c9f185b06e92922448b07b567 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e83a13dfe5783598faadc5033f436f20bfbd25f81d76c753dad2c26a832da42a +size 199058850 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d99b5864cc6954062ccc93ae22a71326f238d3f9 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:82598324103324d75d7c6a2458338c82eaac3112d69c0ec3bdeb27285628d87f +size 199058850 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..68fb184ca6c8a5d310a9db4f39a32e019356101d --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:38b517a579a8a4ee7fb187e2e686072871e4cceda600c3374728675a9dfc1b12 +size 199058722 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..abcb13f46a6cc50133eb435388ab609e67799759 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:821211dc713cf7b08a55d1cc7385cdd0289ceeaa1aa8d514e79b07e1b29f16b3 +size 199058722 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..146ead61bced8623949b19a40c7930631c1d6200 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b837a91cbbd6f0384c8cf1f3fec535d4b551f316c774c2fc090aefaab7f110c9 +size 199058658 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d0193ddfa2431fae49caeb5954082ee3e8cf4a17 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:80ca49aa0b04e687a83a023f2ae2420d772bd3067b1fa50367b67fcc975c48f5 +size 199058658 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..09abecb51f7e0e67be0d0f487aac5213b5e51562 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc132734ea04f7bf2eda41570247df0fa93a41ab5a1012878c2fae46fc85bfc1 +size 199058722 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c33c7cf450e96f5068b3e817e1d72dfdb9a6ba6d --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7230392ae78ddab7eb4d4e0285f8646e7fd5cb2436cd390b4ccbf5497d05d144 +size 199058722 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..42e1a95a04b40651baa84d8d5bf5d0796f67d73f --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:358e10ba558dfdf1065037769cf5629b50ece4a8acb70b5ea69936f4b228a02a +size 199058658 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..68fb4b903110a0ac8227b32511797e9ae26888bd --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:71c12a6b754ccdfacac05b01ea28d942253e7528c256ee3b8b6fd8d79f638c2f +size 199058658 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..62bae8fab6e51b41f112df5d9b262eda2d6306bd --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eef4d84b45999066a0c3d4ed8319ab1c434f6ff562925a32a06b92d6aa4a893b +size 199058658 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5ff59955f87eecfc46a581d76f5240e4ceaa2c12 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a89d316c62deabc6f07fefe1d93b9ac5fefe2821c5e1ee9f1bfffc54d91f6956 +size 199058658 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..94853a09a39024d898d9c72a792c4680c8f9a1ca --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c280eb38f55fa0aaefeeb768632a42ac39808085a4c713c9253ae0ec3e62fb1 +size 199058775 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..998a32f09833f430006c390646b9d75853114bd9 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ecee93dc1c9313f64bfdb12cd61f68b1fba8091c2e153351a1fb6ac808252206 +size 199058775 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..478cffc971f8317584a2e02637db73980b5015a7 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2379740e85be87ca5cfd46febdebdda7ba54d6960b06ff17603801a944dbb101 +size 199058722 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ab3f5a23cb7c8098c8bed64ea965af9f9e40e574 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9fa8e845898b155516ee52cf0f41975da01f1708477ed9704eea6c13e4992335 +size 199058722 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e3749ae193c3021ebefd15c1f85e0df1b8629ea0 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b12e9600f08201db14c191bcf5dbda6cfbe1d5a14a23d2f1944d1feb1b1fb66 +size 199058850 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a44560c3142a90f40f68d47e0e374265437f9f32 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f1597bb987157c88d34dc84eda04c65e04926b9b5f825029f4e2ef4bfe42112 +size 199058850 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5a68e80a1c71de1cafc10d2ceb38f35e066afcc4 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46f48fdc425366a5c8615f4598a3ac8119546d5e68eeaab8e708b73fb4fffe56 +size 199058722 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..46a8393a932e926c3a45ec91b30c6508e4849d66 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f3e87a42c2f39241f316a858df5f53cd54c33d54afec8c1c401a051014dd255 +size 199058722 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ccee9b522917e45fc124461b22dc6e42ea33b931 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d56b0df30256fc6cb4468c55a5a272db545ebe34152999f4820df4235cf78365 +size 199058722 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..22c258817ce1bb3a3057d62cad816cb2ea657a66 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b950fb5afe1a1f61e4ccf317817c0fcaad9307d20b49aa7c4c2a0d95dcee8131 +size 199058722 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..698f5e26c88affa6afd4ec81388d71a4546fb41a --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:524a9c82be91ec134fae129e75a3d0688a43a783cc75079a618bd46c19270397 +size 199058722 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0b2b92aef01ce29845dc1bb7b6d8149adbab7a0c --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:619ba600d21cdd86c514f65fc2da0b30485165b3dc2d4ac837b80b834c85a476 +size 199058722 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..18c1571b4f7cb252e9f039a47be98df75b72cf32 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8513553c07e2e6fc50968b0c6af8ea05e4fd3d7c48a644ebbff9cea1a277fcd2 +size 199058658 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5026ae317f65f1b05782604cbbdfc324e365afd4 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f686041aac227f45b28ed475bb9875d7f16d536e28966b77f02a6cc274e91446 +size 199058658 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..116e0421d67ba2dd6702f57936aa50a5b8019b1f --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:47e7abb5cc46c11771a1cf669ce88273d723d89f892cfa8a412c715fa0453280 +size 199058722 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..43fdd18b7b165d977dcae04114fc4f0f0249d8c5 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:663d2f3b2eb2f2ac3ee8ea7d65e51e1085901f85d84a3ffd9aee6897fde69cfd +size 199058722 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d2e2ff775664bfb9ecccbf9826f2aa159bc5a7b0 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:168c21290bd494bb04a7a8a1f6a55aedc3642da04d3de27cbf7832aec0f28b65 +size 199058658 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..49782cec01dd76e6eb9352627528f9b3de6f7b2c --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f07c5ea4fc22d528cb733a8ad2af9f028b5e719f8bcef4011ef27ff2df3c1d91 +size 199058658 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5ed4f512b028037274ae3e42c24a69900f06c176 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2bd5099158583ed67931189db6bf67500b906e060077e38025bbd5bbdc1f10eb +size 199058914 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..be6595b9b9f256f4a4633d35c6790a3d48893b53 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0995972f06258060565eeb6e82bf4997b555f2a477a01ffb77c600e41c7d43d6 +size 199058914 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9430d90ff5b150937872ddc1fab09dcbffed42ad --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c81e6b4f5b0017fdb8314fe7763c076c0762f089e0ac784278c5f2698617aed5 +size 199058658 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..04fda821c4ccb5686dcfb024ed51b33e5d6d7ff6 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9929625eb06d7d3e06d62937815c786868d1023a1c7f866e727f5babf5431235 +size 199058658 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..81bbf4673b1d291ef25452193c2d3cf99e98619a --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0312ec025e2aaa33cc89bf65359fce5f1fc9e9fb3495bd2b5076e5a7ebafa1a8 +size 199058711 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c8ffd282cd07a17e01d7aa0edbdda378743e4e87 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc7d736b0dcc16a98ef71b4678dcaf444326727a279166e669ac3d1eec6f1216 +size 199058711 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..56db008bbc8d0ff15cb51b56f24431e56eaac1c3 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:70f50473768e0210ebca7d5098faf1de3cd594e4e1d97b093ba7f9949a17d6aa +size 199058722 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e2684bebc00ea1b80f5967604a8822df1bc15ba8 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23c516316bc1133c9fa45e1234d61247a3cd20f3af2d3657e34b61c80fd680ad +size 199058722 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f7376cbfbadfa09db50b10bc0be75229febf8360 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c5faab908d07f42c7144ee07056d881838234e18cdfd770f03cc2510feabcbd1 +size 199058722 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..111a796d9a060e98e76a8beb960ee50dd4277de8 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d0117a2a29fb85e234343eeec58136e1dd1d02b6daafcbc873dee237672f0e8a +size 199058722 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e702a5518613ed5eb4d6b18b34d82960f9fbc702 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:79bc6a11aa593c4f4a5d41d61ef99f0aa98fdb23b55571b39a18f045bf58f2cd +size 199058722 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ec859ed58b5ac027afd697c5aa747fd9a36a6474 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97beb96311c6e60143ca5642f141024a44674c0f53fb2e7d5ecc5f1f2c546514 +size 199058722 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bcd8fb0c68956e38650a35174d4c6b740da6a46f --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a118eeb5be5cd1e8fd1ebe89ababbfbd70c3b0325e25a627bea61eec74705858 +size 199058658 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..addbf1cd988d253dfbaacc6a074119cc8ada207a --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1858bfcc80ae103f45021895749a9db69c3daa070a01f1f68722bbc4bd392e2a +size 199058658 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b9a6286e4d27c8223bea6e27a555cc54716ad962 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2bdc4d1f985452da19e975d1105d0f4a7018449aba77da93d097820f13d71f39 +size 199058658 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bf96e057632301b932734d1c0004daec18bdae68 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a3ac0d5b63d03093da64f5771bb99615433c0c7f0c1481718b3a7ec541de06b +size 199058658 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..45bf4199f79273e11aa442f09785395ee9f35b9f --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f57bdd6a0849f5219790e6ff1750145febb36eeedd4977a11c0dcd16062ff32 +size 199058850 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..15b22eec503abeeac5f0253b135aabfd9e20637e --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:809a122662c67dfe0090f9d1d2abe4ce8029d3e2bbc0ffae6a89c2ebd98435d4 +size 199058850 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b1728b1329569023ba18a0b39f9d1279b1808805 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a5be82a215fbaf8650418f5d72a0f1eedc2b5bb1f9dcb92597a5af731d9373b +size 199058722 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e7f00ea5e235bc13fd76b59d3158c5abf35f9d32 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6faa0e6281abb007d8d6f10abce4b83f635d7abe8c64abd50c745279ba4d1af5 +size 199058722 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e5514672495c96dca5eca1b4af6d8df30aafcc55 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b60b34147417b5d5e35c80aff3f80e620e20cd4df74d625129a2638e44d39c5 +size 199058786 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c3def78f5123051a20c4d62a23627230b44f59b4 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d77b903154fc25d5807496803b9e3aee42401ee62cedbd5033fc7c3a43e227e5 +size 199058786 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..479ee2b476c47e5fd926936e937e6684398fae92 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31645c20126d33899e66ece149617c08cfccf248d255e25e137ac47a2726b07f +size 199058658 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e29e213070afb4682a1579982263c82dd1fe773 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39116efc796df54d98280b8ccc851b4461bfe237f1fab4ca55aadff6a8b706ef +size 199058658 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f752010f6ac5780d7e8f2d8f877eba64ae31001f --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:62076ad529415c8995b93922475ac1ec4a608fea0f4e9cbbbf1a498fcb03cd65 +size 199058722 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..faf8ff9f0ed0df3f372a934927eaaf9077ad5f7c --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58ba67013c37b920d879190634de91f9d269187e16f9b2d473f3a7dd44972b5a +size 199058722 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..77f685b5da9bbc1b28dcc2ee3e748662ba4eb2d9 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b1be21c110a695cd094c96a32c20e38d80e0ca0a50b362d95a95a1f092e38bda +size 199058647 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4688547968799efdb097df1e5ea47f92ba73abed --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d859cfb0236aad1436783dde263bf00a1dcde268b166561be3d3a59f1dbb7aa7 +size 199058647 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5a704d99da201aeb5bf1816b20779e752232060a --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a3d742cef8763ce0c4409da9bc3832cf86398d9d45162916d8e5f4f668fa6ed +size 199058658 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ef12fe814499845f244653c6af458e2f62bd8c9b --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:432816001d6bcb957fc17aaae612d338332a7f0b63a148ddc213e07c7364674f +size 199058658 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e01df16e535870a6dc1580473ba4f479cc3b14dd --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:07bec6ca4d016588e67d273e04cb08267083110ba51ad31edc50afc3d8dbe909 +size 199058722 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f7c7036be1e91057920a8fabd7a303f0cde1aad1 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ffdd7e4255c0fb49ab297249e5b400556bcc5e4c4e20ade49596811d11cd9b8 +size 199058722 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..42f49bdf3ce6edc4919e51067cf99c318ac0582a --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b7fbdc90c662918460491d4742cefcf77469d4c2f1ad3f4772ea8ffb9c4a1fcc +size 199058786 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5bbadec63f941449c1442e17c67c873ffdcfd35a --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cdcf80cb12263516862619772e004fac7141cda73237399a23881e6097a7e488 +size 199058786 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bf84481e4b02990923e326aa7c7b0131ea829228 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:12b4ffdc798dfab13b624aa8ca4cb30f96a33dd7d01704310068115309f202c7 +size 199058722 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..13ecf991e663d524a3d2e97f900b31d1646ed726 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f00686662b83c339f153a294451d98ec404bfe95e3da2a20f0f6e4ea324903 +size 199058722 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e6eadf8c1e40b63a8094dd7b9de4db1bd06d2d51 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d0663236e2f2ce57241ae35b35f5e56711bb5bc9e5f00a8d5e08a66c4c605518 +size 199058786 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ef1c5f1715d1ab9a91fc3f91c0ec879a087b0aa8 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:580ddf5039a07716dc902285d56e7958df131674393a8052b5359a9e379c6757 +size 199058786 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9a40d22ccd119d2e03e341114b0abe80ba50531c --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77851e6f741dbf217a6aa1410d62a2e58234cbf063e187137a45e504f6c59b7c +size 199058658 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0f31ac4dd771f8aede801154b1f9599ac8f3e3bb --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46d16099fd30756ff3403a735328faf4b11978ce5f841c1cc7aa74f3c6e5ba82 +size 199058658 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..819a2b2b0e68f256e7f776b904f28de9a6637d3c --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3fea55730ff6439eb9e66012c1b9f480c5d2618893236444316fd2bdf15e4ec4 +size 199058786 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..79225021e0b5ff59135d96af9336b669d1bdfe1a --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:849e06603a7a8c8912d8b59c908c460d0e331e5ec47bfcbfe271e95e8cb6967c +size 199058786 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f2bec5901ed1b2f4c3c3f9ceab01e0b9ca6b397d --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:44b7e475021a8efaabdd4a94e36f9fe4954c9a619261428773dbb508595ce79a +size 199058658 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ea7d1abbdc42cab5639c06de688021e398a3c965 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:730c0e7cd6f1b6adc8ff0abebd0bdabeabc499e7bc40df12b43cbedecded6fd3 +size 199058658 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ed9eeee79ad9dc6d81b4a87f17d361f3fef91739 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:600e865f10fa7e11f7e2ec2b087fe530cb0bbca9b743133162fb4de0c2d384b0 +size 199058786 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3a873022c125b87070269e42c2d70041ad763dc1 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b5b80baf6d98871be975c489c834fc8646cfe2b88d3c4117d48f7f099dc8f40f +size 199058786 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b7244e093aaea06535b43dace394c083d949e72c --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:440ab21bbaa223c79eb2e410e0298f630425a274240ee8eeb9b300c3f14fc0bd +size 199058786 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8b8df5aafd90504ed55dcd386d9f279dd061ff10 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e5c8d3c4496f43b55e3c7f44f92098cfbab937bb8ac8b58c0e08331c72da13d +size 199058786 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8ac4f8afc4cb8a1f992dfa3853c78f92810b0c33 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db89ac9405a3b49a19a47f1b92d7dfb59fbb87422332e1915719a6d4e3f53e34 +size 199058647 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ef2d1a006c767fb4508267f0957eba9c8eec45ba --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e5cf566852fd77bbbc08be2ad240e53e1cc33e18c8a0dd6b8a4d4dd126260943 +size 199058647 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6864566044aa1e765f1bbb04cd70e83bb0a09031 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:12a5727e082c708ea90bd5034928379fc45d07dd420aa92c945afa8687bda7ae +size 199058722 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2d92e9ff2d109a7ee53660980cc333ca5d614438 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a1059952e2343c716148442498d4a21fe3e08ef92bc5f66cece2aeeeed17c27 +size 199058722 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3523618fecc7fbb29a049aa298f0510a0d5f11c1 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9addbc58d907cae86fe766fc35b6a1a86be3b67fe66c24c24ebdb7e4ca84e25 +size 199058722 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..70cd438a9b3170f9ac46658925fb2ee4caf26d9f --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2339d2ed7080c440875a8976201c1f56cc30a3205769b52212f81a9a6d8fc51b +size 199058722 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e1154922427516095ecf3cfbd51168ea34c65208 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d8a42a883a943a94c927dd4b1066bf35b3ea3e8485fdbaae7495d450babd0ff +size 199058658 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f9133a680ca12cee54a52a66d5c8b1f3c61ddd3c --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a88230569937b145eedc6bd7a0c0544aa2e1a37ee9205fda39dd207c6cc01a2a +size 199058658 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8a59d36ec77475369e605825627a3d9261512a71 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:33c46b5109b126e4023a29b52da5b8a51a5b6fac38234bd2dcd168b6408ef3c3 +size 199058786 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..abfca254234852e674c17c6f2bf2507c1fdaf6e1 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc42cebe227bf12be24512fe480d18d8a704cfe235b85189c32890efe03e454d +size 199058786 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9ed442486d25257474eef8bd433e16034dd67a2b --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae894c9a41b425c13927be0c0437262fbe323f7e565ddd6d6f0481bafeca7af9 +size 199058658 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1131ff2e8a3fd42fe2f7acf5e96528aa6828a84a --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:13cf141e6173dc9dac6b7d8a2eecc701d042da12b3cad599250020e37b169759 +size 199058658 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c293a0d260bcfaa08dcb69bf2efeec8ff47b2748 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a17d712d9a4e5b2918c7b555412ba788c4ca1aadfd82c171573308e420e3c24 +size 199058786 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..309eaab8d9017e52357248254d2bbc2f251d55c1 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5ab11a4e2041c076926838872bbd25ec7b6e7111f7e4165081184bdff625527 +size 199058786 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f272d649cf14ed261fa299fc66eba0601d878677 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:576477a9a726ac9f00007f9f7c2deafa0c4d5d17826e70bd9aa25e8b84371e03 +size 199058786 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..10bc19d08779259cf2f244143b1121299cdc02ae --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b6731e38681b65ac6114f6634a04f1b83653ccefc201cf3ad07f4e6b1ad6c72d +size 199058786 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..98c43780968466a299d52461a31b63e36d81020a --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5660d786f7db8fc889cd3c92adfd9da35da13a9e1ad38a322f073f977da26e8e +size 199058722 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9f33337b07f242bf78a9082fd388a746cf4ad124 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aba4bafb93d1f2cb41af9b2ef7bd165d33ad7e68b2b17bb9ee5d1489169e572b +size 199058722 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d8d67b8ab1693efc40c5bd4220cb2fb051e2ce35 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc530555f767856398f65eab82fa0bb25992f08445a4172ba66483964a000ee0 +size 199058658 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e51e5ee24e4aaa8e108b0381e52670fe80344f02 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02fbde076fc3b4ffdf3ff1cf82dddf90c52358f225912127e5fd9305a3590788 +size 199058658 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2020b10ce5c449365134dded97e1100b4e882c37 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f51bd82021519db9983601cdaf18078bf72542f925ba1fbf6ccbb26c2176b2b4 +size 199058658 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f70d58d80641dc3b5e47cff8c896db12ec0c22f9 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:16701a72516507438f2da5b0eb50b606f35bd02db480d5b68f96d6903e7061f7 +size 199058658 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7940fd00b4832826f85d58f464653ea0157386a5 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d1a01e7ed7b17202982bddfad6404446d7a5668744a474e479f863f8f1250b6e +size 199058647 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b73c015f5ad5631058093d89f058fa184100dfb4 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:749b4bae3e53193e558a2dbe0557bf1f344dc2cc52a854c69d33212abbb2d649 +size 199058647 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e16fa7b0a4762c0b9be148088a224085176cb30a --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ef7f290004d3a8a2d94e29e62329d2b7cb84368f2d40b0f60a3adaad605778d +size 199058850 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..de4603f804ca703fc6b3986043915b108ae257a9 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca3ae71eac6ef5d161adc3c26b8f57e03e952cf297f98d539f8b83e449c70fa6 +size 199058850 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..32015b29eecd0d93dc67b15c28d22fab2039fd83 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ad00423ae70e7efa14ab592329413203fca0f6efc5a8f1d7cb48a0bb849aa18 +size 199058722 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0fe6b633c875e703223bb13770fb3e1f1848cf13 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:134a8e358ad4402620ee7d61927fedcea31aa18c45d1e73e784af21fbcb7c054 +size 199058722 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..79697c4332482cb1194dd3f68966d66dc7788f57 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:699d52646f38b7f79985051c8cecad8baf1185e53d780b3a819315a7f550f0f6 +size 199058658 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1310b4c23231d4ca53b66d96eecebcfc6bc02ff4 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4fb3984fbfe5cc62f897efaf40622e320f44e43c9212c9e82cbaf7b9bc2f552e +size 199058658 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e62ed642e76d596ab8c7512c2a23eaaf7736f218 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e9805e3bc54126ed50a067f49c9760d6ba1aba40d1ed150d57401ef9518f8351 +size 199058786 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..617cb002fcf797780175c6b579e7cc11c8c0fbb9 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77bd703399fb6793bedea53e0cbc4ec0635414cbcc559bb8a053b2f37374d076 +size 199058786 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6816ec06085050fc16b983aaa0be41a384d9ff8c --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c99fd8cac19645c24f5e2b6c1d4d04bbebdf30bdc4d4c53e7f3ef356f2d2073c +size 199058722 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..75067adcb21429ddcfa1a23a34c2d954d57caa0d --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:269d1dd7f82229db3e3def9d0644fed709a7ab05ec11084b1d9bb16ee1cbaa74 +size 199058722 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..07ba631176399b854c6d467d5e5f69ba4a91e8b8 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10b05949e1393ee77156900385090c774e2537e65e00505a68d2c3e75a616ef7 +size 199058722 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..792f57b5621c7cefafeb0c4317ed6c01b1258a07 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:03a8a280a4303c3b49be82ff901bf1ab5a80af115ca88af705c3e4ee59c67f53 +size 199058722 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1e59cfb1b8f7b5bf0540cce12556aa3656036604 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:087455ffdd615658ab3d3e8874a57f6aa42e5513e57dcb503fdd7aa9ae5ad8f7 +size 199058722 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bc4aa6e5a577b96b5b9eee5c75880b26c6735328 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b09c2974e5507e610dca555c9bede326d18e0e37da804118f3ac06c305dd862c +size 199058722 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6f302ea78d3077548ab00705553f40b798cba59b --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35db8296ac799af78be8fb807fced4890d8010e112503c8a1f73e2b28bb9f06d +size 199058786 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ed078fce384b360a6b027d04105f9da9523850a8 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:933a09eca7331b720db555e807f4d174e7fc4715b72471d56f45469a2060a314 +size 199058786 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e5f8fe7de3be0e5b911b45e17b8fcf7efb0e4a33 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:296b939f6ee49f5780fdd164340422af76a8ef77128f8e4c93758b99ef922b43 +size 199058658 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..267bb2aa39a23c9eefbc81a9797912f16a63d586 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b9812da3f0ba9095feec71baa4016b27e4aa2a0365df4d69e48abe1f8e7d7b9 +size 199058658 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..83eb884f9c2185f8ab8da3c71af314a7a15d2d79 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:114514896df34d2931e54908678f2ec598b110a65ce4ed79d0fc97172e45146d +size 199058658 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4a2bd2ac09a0e7ec6cf192dcacd3202159d64736 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf75a1a953906cb3ffa71eb01ca75edaef06adab92bd64dab9c0211e97e16a46 +size 199058658 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..57d35e78186234253ffbc4b54ea4635cfcaab234 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e50ce3f62e135b9ec4417605f9713f4b70ed707ae5a280b32e746e09260a2d4 +size 199058839 diff --git a/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..13abc018bc290c1d3187f8673c4651199ab187ec --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e312851e9290911c77beac6716f36eaa4749a460962c0b4b08d7387bf069068 +size 199058839 diff --git a/4b284b21bc4seed4/global_step80108/layer_01-model_00-model_states.pt b/4b284b21bc4seed4/global_step80108/layer_01-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2d5808d713136fc054e3f34f43b3d9d2f8c805d5 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/layer_01-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fcc03e2ae05334d8df33a487636c7c963e8175b0a028f373c75de3b0cb7c921c +size 167511299 diff --git a/4b284b21bc4seed4/global_step80108/layer_01-model_01-model_states.pt b/4b284b21bc4seed4/global_step80108/layer_01-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d86155599ef83badecd6f10ffb01f486797558b6 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/layer_01-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6267e874c6560809240f9bf493975c797d664a28de3d7c998cb96ad9a343e565 +size 167511299 diff --git a/4b284b21bc4seed4/global_step80108/layer_03-model_00-model_states.pt b/4b284b21bc4seed4/global_step80108/layer_03-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..022677299ad6601aa0e6048448bccb6acb90a966 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/layer_03-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e1a6716d49917d4cb0fa07ab27a5356b4bbed2f2b9bd9930375c1068662b749 +size 113308931 diff --git a/4b284b21bc4seed4/global_step80108/layer_03-model_01-model_states.pt b/4b284b21bc4seed4/global_step80108/layer_03-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..626a099b4b8d3274d74b04391f3484f6383e0ee8 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/layer_03-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a917a7c0a39eda9feaf6ca313e27b31988840b9c922b02025fb752efdda72bbc +size 113308931 diff --git a/4b284b21bc4seed4/global_step80108/layer_04-model_00-model_states.pt b/4b284b21bc4seed4/global_step80108/layer_04-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9b1522c29dbbe68a1587147e8d8961806bd178e2 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/layer_04-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e82c09c664585eafb8abd4f669bbd7aa5911994ede4e0e732fa5ba88e8f117d +size 113308931 diff --git a/4b284b21bc4seed4/global_step80108/layer_04-model_01-model_states.pt b/4b284b21bc4seed4/global_step80108/layer_04-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2eb9ae0be7f0f017b999358cc402685df67f03d8 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/layer_04-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:13e16e059a2c027b2244f8c60598b3e19a0f940d62533504ff9b9749881c7ba0 +size 113308931 diff --git a/4b284b21bc4seed4/global_step80108/layer_05-model_00-model_states.pt b/4b284b21bc4seed4/global_step80108/layer_05-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..878195e8b556a67b3f8d8ea10407ef8af2541b82 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/layer_05-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e9f3327812e81dcf61f47d6e666750a2a63ac73f80e86d847060325e91c189af +size 113308931 diff --git a/4b284b21bc4seed4/global_step80108/layer_05-model_01-model_states.pt b/4b284b21bc4seed4/global_step80108/layer_05-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..316722f33a4bb1dea5f4abfc607cf6b953e3d3b6 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/layer_05-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca79a1bc86b1553c887aeadf2d5b8059879de852da691fb6958b708428a171aa +size 113308931 diff --git a/4b284b21bc4seed4/global_step80108/layer_06-model_00-model_states.pt b/4b284b21bc4seed4/global_step80108/layer_06-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e45a05bda350743fe88d38312e042b2fa5fecfd --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/layer_06-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:258dd56fb317d0fb57bee974b15a8673990616389a2fec987b56671413b0f1c5 +size 113308931 diff --git a/4b284b21bc4seed4/global_step80108/layer_06-model_01-model_states.pt b/4b284b21bc4seed4/global_step80108/layer_06-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f68bda17c6a8d9dd643b2e470b5bc8523b484d8d --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/layer_06-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee1750a3342717379f3c68e2c353e28b07a93ca9b3766fd561cbc90a6679eb67 +size 113308931 diff --git a/4b284b21bc4seed4/global_step80108/layer_07-model_00-model_states.pt b/4b284b21bc4seed4/global_step80108/layer_07-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..577a0f27cb00fbd67474891968c4a033b7b80b13 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/layer_07-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f39d08b27c19132921934222d5de7403f27dd3ad315bf1dcec012d2bdd5b80f6 +size 113308931 diff --git a/4b284b21bc4seed4/global_step80108/layer_07-model_01-model_states.pt b/4b284b21bc4seed4/global_step80108/layer_07-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..25cc1ff27f349e4c21a058d2ab673ee5dad5e9a4 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/layer_07-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f10e062b5f22f9b296ef273a4479d0f2957152252cdd85a16bdd35cf13a2df1 +size 113308931 diff --git a/4b284b21bc4seed4/global_step80108/layer_08-model_00-model_states.pt b/4b284b21bc4seed4/global_step80108/layer_08-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d5dcffe28873d68077edb25a2a18efd43b6396e7 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/layer_08-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:439a875e63e04f609a005f5c278fb4cce83fbd662a702de387bec9eb25bb3345 +size 113308931 diff --git a/4b284b21bc4seed4/global_step80108/layer_08-model_01-model_states.pt b/4b284b21bc4seed4/global_step80108/layer_08-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4a2aa7bf3b39135a72de1972281fbcb6901ff123 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/layer_08-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:296380026569982082477d54e34da8cb24d3eda128801c38c8a4938de4d31f3b +size 113308931 diff --git a/4b284b21bc4seed4/global_step80108/layer_09-model_00-model_states.pt b/4b284b21bc4seed4/global_step80108/layer_09-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bd1093fc320ea9b2c88645a65d523add94c9bb81 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/layer_09-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3db43ef0febdaa4bb52733fd756750697951e93f1bc28fb8833c2c20745f3943 +size 113308931 diff --git a/4b284b21bc4seed4/global_step80108/layer_09-model_01-model_states.pt b/4b284b21bc4seed4/global_step80108/layer_09-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7db646bfd51ac609ae9996275ebca4b734dee6ad --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/layer_09-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ee6129f357452dfe3c06d42055f192823812540b39fe9091dd9f56b3f2ae5c4 +size 113308931 diff --git a/4b284b21bc4seed4/global_step80108/layer_10-model_00-model_states.pt b/4b284b21bc4seed4/global_step80108/layer_10-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..deab24cf0ae1821884035981ae4943138c9d1bfc --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/layer_10-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8fed9b4268b12a29d88c4089f82a15860fb850833f5f8f054f7b59ce0739c4e +size 113308931 diff --git a/4b284b21bc4seed4/global_step80108/layer_10-model_01-model_states.pt b/4b284b21bc4seed4/global_step80108/layer_10-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9a9b066d733811eff778e66b391e9d1ac623717c --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/layer_10-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c09fdde8343bd305156f0d62e3df6469f497cb5ad0774fea4ba29fe6e881b32 +size 113308931 diff --git a/4b284b21bc4seed4/global_step80108/layer_11-model_00-model_states.pt b/4b284b21bc4seed4/global_step80108/layer_11-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..352b35908207fb014f136aca29863176724897bc --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/layer_11-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:557da42e7d33ca9e184144da5f1a2e2d48e53797a8f0ad5d283c2d7396a76128 +size 113308931 diff --git a/4b284b21bc4seed4/global_step80108/layer_11-model_01-model_states.pt b/4b284b21bc4seed4/global_step80108/layer_11-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f8a9bf5844dfd540a189bfc6f2756ab23934757b --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/layer_11-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c66cb5b5cf63912b633848dbb78061ea04064946006d6df425247b1066818249 +size 113308931 diff --git a/4b284b21bc4seed4/global_step80108/layer_12-model_00-model_states.pt b/4b284b21bc4seed4/global_step80108/layer_12-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..90690530e90c66e3c661814b38375a0b9b260309 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/layer_12-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:09ce6fb80f3b752716e3342acb896aa685c0bbfad9b325f2de2b497f0065241b +size 113308931 diff --git a/4b284b21bc4seed4/global_step80108/layer_12-model_01-model_states.pt b/4b284b21bc4seed4/global_step80108/layer_12-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1d5360b1b066031a2b5219fe0af60d15efe7864e --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/layer_12-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:839de43165776d6dec84055f2e98b644987c453643c7083e5cfae3e3bdac4f86 +size 113308931 diff --git a/4b284b21bc4seed4/global_step80108/layer_13-model_00-model_states.pt b/4b284b21bc4seed4/global_step80108/layer_13-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cf6aaf069a5cf95a6fc0bffac449a648e684f443 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/layer_13-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:81e349e490d5f7e47e7e8e0554634a4f7d0d823b04dc809a022cb274652231c5 +size 113308931 diff --git a/4b284b21bc4seed4/global_step80108/layer_13-model_01-model_states.pt b/4b284b21bc4seed4/global_step80108/layer_13-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3e633214143d63bb01acfa095ed95b60ad137d80 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/layer_13-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7faead1331325760e42c53467d078c46a7fdd9cc45bc8d0c65bc77f909ff1946 +size 113308931 diff --git a/4b284b21bc4seed4/global_step80108/layer_14-model_00-model_states.pt b/4b284b21bc4seed4/global_step80108/layer_14-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..92dda6f31748366ee2eaae53b913611d297026bf --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/layer_14-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9098d40a8b259dc43e3b980f4be125759e19eb7a14b4e45fc088bc9aaa2b1818 +size 113308931 diff --git a/4b284b21bc4seed4/global_step80108/layer_14-model_01-model_states.pt b/4b284b21bc4seed4/global_step80108/layer_14-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0b65df525ded2812a8f5daeeddbfdd6806b90e56 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/layer_14-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:04bcde99f52b0aeb890f92376dcddb6430ad47d9a08eef83029c348c392fd82d +size 113308931 diff --git a/4b284b21bc4seed4/global_step80108/layer_15-model_00-model_states.pt b/4b284b21bc4seed4/global_step80108/layer_15-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1cded1248ca5af03832340ee79ffc897b5372116 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/layer_15-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:761ac21ced560f98e388e2d9a1eaff9892f1b9a30aabaada728433eb53a14e95 +size 113308931 diff --git a/4b284b21bc4seed4/global_step80108/layer_15-model_01-model_states.pt b/4b284b21bc4seed4/global_step80108/layer_15-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..989126b6a885e59e8a8f9135b7702ea0bfe8cad0 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/layer_15-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c15305bc6cf826e0dfcde52fdad4f511f2b6a7fad6d9af6d78a4ee07602422aa +size 113308931 diff --git a/4b284b21bc4seed4/global_step80108/layer_16-model_00-model_states.pt b/4b284b21bc4seed4/global_step80108/layer_16-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dbce96805549436e5aa673f6ca15e8004ac7f2ff --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/layer_16-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:19798b3925ab437186be299b80f7da727e93816b86fbd7ccee78a0c35fc9aeb2 +size 113308931 diff --git a/4b284b21bc4seed4/global_step80108/layer_16-model_01-model_states.pt b/4b284b21bc4seed4/global_step80108/layer_16-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f8c93df0404eac54e9046e6c8d9dfad5d157811b --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/layer_16-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46304225f729009bd8ed3571f3ba6297383083fa5eb300aeac4a23445ca07aa5 +size 113308931 diff --git a/4b284b21bc4seed4/global_step80108/layer_17-model_00-model_states.pt b/4b284b21bc4seed4/global_step80108/layer_17-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fcce00614834750d381f3453001a3d539df80497 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/layer_17-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:42267e2d79ed9d20f654f9ce1599e9eeb4d74ed0bb112aec9d162174027552aa +size 113308931 diff --git a/4b284b21bc4seed4/global_step80108/layer_17-model_01-model_states.pt b/4b284b21bc4seed4/global_step80108/layer_17-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..523369167818e36c2e2f7a889172a5e6944c8d82 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/layer_17-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd149808c053f189b35fc4d06b8b9fdede5580acbcc599ff2673b8d4a23e43df +size 113308931 diff --git a/4b284b21bc4seed4/global_step80108/layer_18-model_00-model_states.pt b/4b284b21bc4seed4/global_step80108/layer_18-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2802bdf332f811f50b98b0e8ab898ea29747e9c0 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/layer_18-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d962d9f9587b6f292f8df8404bd1c66ba04d47380522fc435a61ee7f1cfff152 +size 113308931 diff --git a/4b284b21bc4seed4/global_step80108/layer_18-model_01-model_states.pt b/4b284b21bc4seed4/global_step80108/layer_18-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ebb3d7a6c5f0b6305ddf6e217e9e2add8ca4b161 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/layer_18-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af15d504db5cfd31841da5a22ff22f365888847b750c1e12942032361ad8c341 +size 113308931 diff --git a/4b284b21bc4seed4/global_step80108/layer_19-model_00-model_states.pt b/4b284b21bc4seed4/global_step80108/layer_19-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..44db2167ad06a8183a45b675c2f0e0faf734d85f --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/layer_19-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20cfff5d01c47c35a4ff3a5c949a0816ed506f70d733dfbb79f50808d3c3a844 +size 113308931 diff --git a/4b284b21bc4seed4/global_step80108/layer_19-model_01-model_states.pt b/4b284b21bc4seed4/global_step80108/layer_19-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c25ed1111bb1030a3077b9a4d5049e31f551bbc8 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/layer_19-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4fdb9d39807165de1a5790dafb4e829e59ee7fa7c2faae6ed1a7720b3d2c9c57 +size 113308931 diff --git a/4b284b21bc4seed4/global_step80108/layer_20-model_00-model_states.pt b/4b284b21bc4seed4/global_step80108/layer_20-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1e16e6cbfb1d9571a2823f87a99508f58ced2dba --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/layer_20-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f4ced463d16499c7e6a5c306a803f3b5969146e30f562e61d697b639ba268a71 +size 113308931 diff --git a/4b284b21bc4seed4/global_step80108/layer_20-model_01-model_states.pt b/4b284b21bc4seed4/global_step80108/layer_20-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7f101d6214bd5c3b59b50f261c247e8c28334e81 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/layer_20-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84799505404cf9e186347afa097615e3778dab7fd4cd432c3b47f1218b88d85e +size 113308931 diff --git a/4b284b21bc4seed4/global_step80108/layer_21-model_00-model_states.pt b/4b284b21bc4seed4/global_step80108/layer_21-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..55c5db4db8ce87efa594b67e2bc518b35c90da97 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/layer_21-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:71e991ee73c18d71b58635a9490324505ce8a52e429d9694c58b30e03db75562 +size 113308931 diff --git a/4b284b21bc4seed4/global_step80108/layer_21-model_01-model_states.pt b/4b284b21bc4seed4/global_step80108/layer_21-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..514b23507d9dae26e056f3258a67548ddccd03f0 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/layer_21-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aee3836978bf70152849f7349f4d125ef62282ac36effbea1fc9aa35dfd9c788 +size 113308931 diff --git a/4b284b21bc4seed4/global_step80108/layer_22-model_00-model_states.pt b/4b284b21bc4seed4/global_step80108/layer_22-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2f05072788e67c5e361c7eb5769b0c4616a0aed4 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/layer_22-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc0d24588d221b7bc121ac17b410794bfe5bf7eca1cb2a900e70e037aa75c7c5 +size 113308931 diff --git a/4b284b21bc4seed4/global_step80108/layer_22-model_01-model_states.pt b/4b284b21bc4seed4/global_step80108/layer_22-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ad71c9fa5d1311513e86cb0f18523fc5a9ef7a60 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/layer_22-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:41b3024530270e805f5695ee6b5656f9ccd4ccb09c597abc6ffa4ebc534ee5a9 +size 113308931 diff --git a/4b284b21bc4seed4/global_step80108/layer_23-model_00-model_states.pt b/4b284b21bc4seed4/global_step80108/layer_23-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f2a8b35b1854c9dc2faf43e00417bbf8c545e0b4 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/layer_23-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c2400dd858a54cf495f7d51c3b3c15c24fabd977de516e7a3584f1d3559c1187 +size 113308931 diff --git a/4b284b21bc4seed4/global_step80108/layer_23-model_01-model_states.pt b/4b284b21bc4seed4/global_step80108/layer_23-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..18eb3b21d09678f55f2d312c9af81cdd0613a1a1 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/layer_23-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f572e960212cede42b302a248b33f437cf9665eb38f17c1806c1fa7d047e692 +size 113308931 diff --git a/4b284b21bc4seed4/global_step80108/layer_24-model_00-model_states.pt b/4b284b21bc4seed4/global_step80108/layer_24-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5726d8dd083ec5af1f21463524efcc9d81d9d395 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/layer_24-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3dae5dc84523e1d690eaed0576f991156026a817ed773ba2a94df09bc087002c +size 113308931 diff --git a/4b284b21bc4seed4/global_step80108/layer_24-model_01-model_states.pt b/4b284b21bc4seed4/global_step80108/layer_24-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ef87903bb6245ae1a2b2a3987f881504e64adb96 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/layer_24-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:96bb427fdf4e88b3a9a899d1a0f2504e99c8f442ab82b51accb068c476063996 +size 113308931 diff --git a/4b284b21bc4seed4/global_step80108/layer_25-model_00-model_states.pt b/4b284b21bc4seed4/global_step80108/layer_25-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..79a1b5f99a414a1e5a51b5c69d3b5f9171a9628a --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/layer_25-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce90c1f1f26bb4a5b3e3af6e00f0609640483d0bf7bc838c7a143c8ce21c4ea6 +size 113308931 diff --git a/4b284b21bc4seed4/global_step80108/layer_25-model_01-model_states.pt b/4b284b21bc4seed4/global_step80108/layer_25-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b10753b3c9df01d43aad666673cc6178ef48b36a --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/layer_25-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:136d1bb242eec41d62c4b77e149d598e5a55d1b905138bac6b9e20263a7f97d7 +size 113308931 diff --git a/4b284b21bc4seed4/global_step80108/layer_26-model_00-model_states.pt b/4b284b21bc4seed4/global_step80108/layer_26-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a65426c4c83b6038b29556792863bd0838248be3 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/layer_26-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e26b7634f3a03199a64d99311db6c738b0b1659226c3647043595d934dc9ab12 +size 113308931 diff --git a/4b284b21bc4seed4/global_step80108/layer_26-model_01-model_states.pt b/4b284b21bc4seed4/global_step80108/layer_26-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..70de1c389bccf0a75d40e66aa69052587e2ebd01 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/layer_26-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:85d101b3973f701b2897c748fb00ec17910f7c60bfc9834296002f5b3d9a7f3a +size 113308931 diff --git a/4b284b21bc4seed4/global_step80108/layer_27-model_00-model_states.pt b/4b284b21bc4seed4/global_step80108/layer_27-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..56a6178b86ce7b20b6a7273c65238b979e736305 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/layer_27-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3478e12303015b0ad78216e4b765b292050d6a529597a432ab71cb2955f0ddf2 +size 113308931 diff --git a/4b284b21bc4seed4/global_step80108/layer_27-model_01-model_states.pt b/4b284b21bc4seed4/global_step80108/layer_27-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..92ff796a959dc24abe5824d0896d8569bee894cf --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/layer_27-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6058b55e8f5d007dfb69d6b1c351e2c6c762b21e3ca25b863dbb435708d30d5 +size 113308931 diff --git a/4b284b21bc4seed4/global_step80108/layer_28-model_00-model_states.pt b/4b284b21bc4seed4/global_step80108/layer_28-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8f84371d73d8da14b5f8f8a5d99abda06bf6d923 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/layer_28-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0db93e533795dffabf6f9799dc4a557d8bf6fbed1e2d1fc11b23cddde1709871 +size 113308931 diff --git a/4b284b21bc4seed4/global_step80108/layer_28-model_01-model_states.pt b/4b284b21bc4seed4/global_step80108/layer_28-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..da356eba3378cead9497a03876eb2d05f7279fd6 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/layer_28-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f20aa5c972291d5555ba8be6c034ae13e338f13acfccc1e88a6428d3bda57b9 +size 113308931 diff --git a/4b284b21bc4seed4/global_step80108/layer_29-model_00-model_states.pt b/4b284b21bc4seed4/global_step80108/layer_29-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0a5d785294f6d630a9b19e34d1d47bbee576b7fb --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/layer_29-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:37663e4799ebfaff5183aa78a4f5904b76758ec99eec193a614b1e1bd52f5aae +size 113308931 diff --git a/4b284b21bc4seed4/global_step80108/layer_29-model_01-model_states.pt b/4b284b21bc4seed4/global_step80108/layer_29-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d34a759a30b176dbe5349951121fb6f18a1aacbd --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/layer_29-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea3044c400d4a414a6c1d4db1a6248c9e2b91fb8ad1b1665716d06194431d741 +size 113308931 diff --git a/4b284b21bc4seed4/global_step80108/layer_30-model_00-model_states.pt b/4b284b21bc4seed4/global_step80108/layer_30-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bcaa7262091fb32e03452497d8ef8049384db766 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/layer_30-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6aacb8590de4d4f305a61502e90229c6d5c4c09616295c8f232fd690d63f05ff +size 113308931 diff --git a/4b284b21bc4seed4/global_step80108/layer_30-model_01-model_states.pt b/4b284b21bc4seed4/global_step80108/layer_30-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..279d08c130167ddec6c381bc4eec634891a31469 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/layer_30-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:28e76b491a2b64de65d0729b3e354d84b0c3d083506e3c5e065f0cfceb016a58 +size 113308931 diff --git a/4b284b21bc4seed4/global_step80108/layer_31-model_00-model_states.pt b/4b284b21bc4seed4/global_step80108/layer_31-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..588422e9487bf59c6aa834a19810691711aeb8a6 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/layer_31-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f82a25bbd6c61f0e904f95e8ab27b082c5c4a27861a7002ac05483fcaf80d59 +size 113308931 diff --git a/4b284b21bc4seed4/global_step80108/layer_31-model_01-model_states.pt b/4b284b21bc4seed4/global_step80108/layer_31-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..61f5799d2f3c81d9adee1c710a164deeea21382b --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/layer_31-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da8ae5e75e0743b6c127b934d4dd2d334f893f892183f9604c0a086f3efb7404 +size 113308931 diff --git a/4b284b21bc4seed4/global_step80108/layer_32-model_00-model_states.pt b/4b284b21bc4seed4/global_step80108/layer_32-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..50442069975288ab0821eee69cb3bd3646b66b96 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/layer_32-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:584b31dd95df80992d13d139a2eb87913039b39e05161fe3a04d5b3b0b2d6fe0 +size 113308931 diff --git a/4b284b21bc4seed4/global_step80108/layer_32-model_01-model_states.pt b/4b284b21bc4seed4/global_step80108/layer_32-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7ce12e2737a00df9fa80fd5146790a7a5158c1c9 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/layer_32-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:66314697ccbee6b4ce92b3c029ed8a91e4e7f0e191ca23dcaa2427e86bb53781 +size 113308931 diff --git a/4b284b21bc4seed4/global_step80108/layer_33-model_00-model_states.pt b/4b284b21bc4seed4/global_step80108/layer_33-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8a59b21f658505664fef5cf31f032ed0e006764b --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/layer_33-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:948205d74035fa2c58db711b858a5d268cd9df8eb689958e940018dc4a48ac15 +size 113308931 diff --git a/4b284b21bc4seed4/global_step80108/layer_33-model_01-model_states.pt b/4b284b21bc4seed4/global_step80108/layer_33-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cb96dbbd9d6bc6bd2dc9a2e20d61669c85609942 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/layer_33-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:89e53e03cf1f5e4abd22b5f71d19bd01a0ab77c39b18205ecb27860002a680cd +size 113308931 diff --git a/4b284b21bc4seed4/global_step80108/layer_34-model_00-model_states.pt b/4b284b21bc4seed4/global_step80108/layer_34-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d86914a0085ecff0064c091b9819fded18edc45e --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/layer_34-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:89da7f691de7a8542f22d86cb7e8257eb6c8ece00fac780744aabdbb5d30df30 +size 113308931 diff --git a/4b284b21bc4seed4/global_step80108/layer_34-model_01-model_states.pt b/4b284b21bc4seed4/global_step80108/layer_34-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f25de5067f351a5458dc2265b179b710bce373a9 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/layer_34-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:72776d058f424751f477a0938f8da9775d0945714cf513ba339e8b25317b32a0 +size 113308931 diff --git a/4b284b21bc4seed4/global_step80108/layer_35-model_00-model_states.pt b/4b284b21bc4seed4/global_step80108/layer_35-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d5846953f8ac2d6be40b3bc32f886a6d2ca63189 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/layer_35-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:162b6ca9f401c9261032f471fe2ec4c85654c3c082ca62c6cdd98dc6648fa2e9 +size 113308931 diff --git a/4b284b21bc4seed4/global_step80108/layer_35-model_01-model_states.pt b/4b284b21bc4seed4/global_step80108/layer_35-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8e240b154316b8d162173f7fc007268cac5fe04c --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/layer_35-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9dd506c32c2e55650ca4b9e77af8383a15bdeac865f4d2ed3f93ee48abae03e1 +size 113308931 diff --git a/4b284b21bc4seed4/global_step80108/layer_36-model_00-model_states.pt b/4b284b21bc4seed4/global_step80108/layer_36-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..347d2715faff1a30b6d19a76301258986e5a2693 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/layer_36-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f006933d512ec435f6e7cb5d167dd593561427fef3b515c3aa218783cfb5bd4 +size 113308931 diff --git a/4b284b21bc4seed4/global_step80108/layer_36-model_01-model_states.pt b/4b284b21bc4seed4/global_step80108/layer_36-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3ba7c81157990a1a46623e0b54e7232936fdd461 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/layer_36-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:710bcca892e15ebbe5cb4bbd19f8ec3edd4fad8a40fec1de90dfb23d89390ae3 +size 113308931 diff --git a/4b284b21bc4seed4/global_step80108/layer_37-model_00-model_states.pt b/4b284b21bc4seed4/global_step80108/layer_37-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f78116e5142efaadb86804de26f279babb99dcd5 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/layer_37-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8df98204a2c9bb7a23b354ffeaa7601504e6a23eaed9959a68c944e2f2802bf2 +size 113308931 diff --git a/4b284b21bc4seed4/global_step80108/layer_37-model_01-model_states.pt b/4b284b21bc4seed4/global_step80108/layer_37-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a724a960c0b37421de0afc5850c6ef73ef059727 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/layer_37-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8cc68e411c0f8e7d3995c6931777edae7434942c36cd0e49fbaaeffc18890699 +size 113308931 diff --git a/4b284b21bc4seed4/global_step80108/layer_38-model_00-model_states.pt b/4b284b21bc4seed4/global_step80108/layer_38-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..55dd0b1ea625f4492f0634b43f68d1a2633a4642 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/layer_38-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:96f9f01e24ef5c9259a372b89312f5be8c06b6b32261e5450eee7c76848b4f8c +size 113308931 diff --git a/4b284b21bc4seed4/global_step80108/layer_38-model_01-model_states.pt b/4b284b21bc4seed4/global_step80108/layer_38-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ad6668a68e06533eadfe8bab7f1d8ac19bed9112 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/layer_38-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:66b9838e5064f9b60a3b5e3cae4d0cd9e144e6a74a092cc932b0a992d1ce310e +size 113308931 diff --git a/4b284b21bc4seed4/global_step80108/layer_40-model_00-model_states.pt b/4b284b21bc4seed4/global_step80108/layer_40-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6d217796323b3ca386f6beb7beac4d0ae5ad19ea --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/layer_40-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b390beb1b5014b01288bef7509d3fae6e666fee4afa93b04298ca59fd340e8cd +size 13507 diff --git a/4b284b21bc4seed4/global_step80108/layer_40-model_01-model_states.pt b/4b284b21bc4seed4/global_step80108/layer_40-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bb9ef18d933c7681b52205ea248da56a2c0547f5 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/layer_40-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:49b8c55c480ed9ea68090a283626077824f45d50620aa3d315ee8220f3c99c86 +size 13507 diff --git a/4b284b21bc4seed4/global_step80108/mp_rank_00_model_states.pt b/4b284b21bc4seed4/global_step80108/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..39ef32510fd700e6a5623083cfb6e2d1260830a3 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35ddeab8617bc4cf276ed20ca7acbfb9f01dc18ec8e1d11c598fc29a0d6cfc97 +size 51443 diff --git a/4b284b21bc4seed4/global_step80108/mp_rank_01_model_states.pt b/4b284b21bc4seed4/global_step80108/mp_rank_01_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0a2703961e5eb94dfb989e1694b4fb4fa097b822 --- /dev/null +++ b/4b284b21bc4seed4/global_step80108/mp_rank_01_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:28d47e39172d5594a32fee2e5b4ea4291c4aefdb37dd46ddc26dc2ee11535556 +size 51443 diff --git a/4b284b21bc4seed4/transformers/config.json b/4b284b21bc4seed4/transformers/config.json new file mode 100644 index 0000000000000000000000000000000000000000..df814c3a71ee49044410636b5eeb4f43611690ba --- /dev/null +++ b/4b284b21bc4seed4/transformers/config.json @@ -0,0 +1 @@ +{"vocab_size": 50432, "n_positions": 2048, "n_embd": 3072, "n_layer": 36, "n_head": 24, "n_inner": 12288, "activation_function": "gelu", "resid_pdrop": 0.1, "embd_pdrop": 0.1, "attn_pdrop": 0.1, "layer_norm_epsilon": 1e-05, "initializer_range": 0.02, "summary_type": "cls_index", "summary_use_proj": true, "summary_activation": null, "summary_first_dropout": 0.1, "summary_proj_to_labels": true, "scale_attn_weights": true, "use_cache": true, "scale_attn_by_inverse_layer_idx": false, "reorder_and_upcast_attn": false, "bos_token_id": 50256, "eos_token_id": 50256, "return_dict": true, "output_hidden_states": false, "output_attentions": false, "torchscript": false, "torch_dtype": null, "use_bfloat16": false, "tf_legacy_loss": false, "pruned_heads": {}, "tie_word_embeddings": true, "is_encoder_decoder": false, "is_decoder": false, "cross_attention_hidden_size": null, "add_cross_attention": false, "tie_encoder_decoder": false, "max_length": 20, "min_length": 0, "do_sample": false, "early_stopping": false, "num_beams": 1, "num_beam_groups": 1, "diversity_penalty": 0.0, "temperature": 1.0, "top_k": 50, "top_p": 1.0, "typical_p": 1.0, "repetition_penalty": 1.0, "length_penalty": 1.0, "no_repeat_ngram_size": 0, "encoder_no_repeat_ngram_size": 0, "bad_words_ids": null, "num_return_sequences": 1, "chunk_size_feed_forward": 0, "output_scores": false, "return_dict_in_generate": false, "forced_bos_token_id": null, "forced_eos_token_id": null, "remove_invalid_values": false, "exponential_decay_length_penalty": null, "suppress_tokens": null, "begin_suppress_tokens": null, "architectures": ["GPT2LMHeadModel"], "finetuning_task": null, "id2label": {"0": "LABEL_0", "1": "LABEL_1"}, "label2id": {"LABEL_0": 0, "LABEL_1": 1}, "tokenizer_class": null, "prefix": null, "pad_token_id": null, "sep_token_id": null, "decoder_start_token_id": null, "task_specific_params": null, "problem_type": null, "_name_or_path": "", "transformers_version": "4.25.0.dev0", "n_ctx": 1024, "gradient_checkpointing": false, "model_type": "gpt2"} \ No newline at end of file diff --git a/4b284b21bc4seed4/transformers/pytorch_model.bin b/4b284b21bc4seed4/transformers/pytorch_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..724b783000501beb3f60f57324980f4edb86a055 --- /dev/null +++ b/4b284b21bc4seed4/transformers/pytorch_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d7f4fa937017d12092f74e45e83873a4a2534c465a15d5a9842b0303308bd75f +size 8781203669