diff --git a/.gitattributes b/.gitattributes index c7d9f3332a950355d5a77d85000f05e6f45435ea..c9dc472a0977e1c79784f0557e87f92e2a1584d9 100644 --- a/.gitattributes +++ b/.gitattributes @@ -32,3 +32,27 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text *.zip filter=lfs diff=lfs merge=lfs -text *.zst filter=lfs diff=lfs merge=lfs -text *tfevents* filter=lfs diff=lfs merge=lfs -text +perplexity25/evaluation/generation/examples.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl filter=lfs diff=lfs merge=lfs -text +perplexity25/evaluation/generation/examples.perplexity25_GEM-wiki_lingua_en_tldr_en_0.jsonl filter=lfs diff=lfs merge=lfs -text +perplexity25/evaluation/generation/examples.perplexity25_GEM-wiki_lingua_en_tldr_en_1.jsonl filter=lfs diff=lfs merge=lfs -text +perplexity25/evaluation/generation/examples.perplexity25_GEM-wiki_lingua_en_tldr_en_4.jsonl filter=lfs diff=lfs merge=lfs -text +perplexity25/evaluation/generation/examples.perplexity25_gem_xsum_article_DOC_summary_1.jsonl filter=lfs diff=lfs merge=lfs -text +perplexity25/evaluation/generation/examples.perplexity25_gem_xsum_article_DOC_summary_5.jsonl filter=lfs diff=lfs merge=lfs -text +perplexity25/evaluation/generation/examples.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl filter=lfs diff=lfs merge=lfs -text +perplexity25/evaluation/generation/examples.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl filter=lfs diff=lfs merge=lfs -text +perplexity25/evaluation/generation/examples.perplexity25_GEM-web_nlg_en_PALM_prompt_1.jsonl filter=lfs diff=lfs merge=lfs -text +perplexity25/evaluation/generation/examples.perplexity25_GEM-web_nlg_en_PALM_prompt_4.jsonl filter=lfs diff=lfs merge=lfs -text +perplexity25/evaluation/generation/examples.perplexity25_GEM-wiki_lingua_en_tldr_en_3.jsonl filter=lfs diff=lfs merge=lfs -text +perplexity25/evaluation/generation/examples.perplexity25_gem_xsum_article_DOC_summary_3.jsonl filter=lfs diff=lfs merge=lfs -text +perplexity25/evaluation/generation/examples.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl filter=lfs diff=lfs merge=lfs -text +perplexity25/evaluation/generation/examples.perplexity25_GEM-web_nlg_en_PALM_prompt_3.jsonl filter=lfs diff=lfs merge=lfs -text +perplexity25/evaluation/generation/examples.perplexity25_GEM-web_nlg_en_PALM_prompt_5.jsonl filter=lfs diff=lfs merge=lfs -text +perplexity25/evaluation/generation/examples.perplexity25_GEM-wiki_lingua_en_tldr_en_2.jsonl filter=lfs diff=lfs merge=lfs -text +perplexity25/evaluation/generation/examples.perplexity25_gem_xsum_article_DOC_summary_0.jsonl filter=lfs diff=lfs merge=lfs -text +perplexity25/evaluation/generation/examples.perplexity25_gem_xsum_article_DOC_summary_4.jsonl filter=lfs diff=lfs merge=lfs -text +perplexity25/evaluation/generation/examples.perplexity25_GEM-web_nlg_en_PALM_prompt_0.jsonl filter=lfs diff=lfs merge=lfs -text +perplexity25/evaluation/generation/examples.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl filter=lfs diff=lfs merge=lfs -text +perplexity25/evaluation/generation/examples.perplexity25_GEM-web_nlg_en_PALM_prompt_2.jsonl filter=lfs diff=lfs merge=lfs -text +perplexity25/evaluation/generation/examples.perplexity25_GEM-wiki_lingua_en_tldr_en_5.jsonl filter=lfs diff=lfs merge=lfs -text +perplexity25/evaluation/generation/examples.perplexity25_gem_xsum_article_DOC_summary_2.jsonl filter=lfs diff=lfs merge=lfs -text +perplexity25/evaluation/generation/examples.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl filter=lfs diff=lfs merge=lfs -text diff --git a/perplexity25/evaluation/generation/agg.perplexity25_GEM-web_nlg_en_PALM_prompt_0.json b/perplexity25/evaluation/generation/agg.perplexity25_GEM-web_nlg_en_PALM_prompt_0.json new file mode 100644 index 0000000000000000000000000000000000000000..7e7839f3d47bebbab63ae19fcadb83b03e27af89 --- /dev/null +++ b/perplexity25/evaluation/generation/agg.perplexity25_GEM-web_nlg_en_PALM_prompt_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.35947270396511505, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.03976947372157981}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.07545439815870926, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0022680323540535106}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.3521835615440358, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.00619686620162303}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.10839552028832326, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0021723652033459194}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.032699451519105735, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.001384275605757562}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.15406776335401268, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.003465085716143713}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.047276019716226934, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0012856377731630094}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.07039855492701995, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0020974056683073722}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.3340045099502354, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.005873382118908422}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.10130202856745985, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0019472676322570249}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.07004936083081541, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.002133247465940297}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.3244285334323993, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.005600594696630026}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.10030698310345207, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.00199704924468202}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-2b8-55b-oscar-perplexity/perplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/perplexity25/evaluation/generation/agg.perplexity25_GEM-web_nlg_en_PALM_prompt_1.json b/perplexity25/evaluation/generation/agg.perplexity25_GEM-web_nlg_en_PALM_prompt_1.json new file mode 100644 index 0000000000000000000000000000000000000000..4eacbe87db531c10dfa2cc15028c358cab731589 --- /dev/null +++ b/perplexity25/evaluation/generation/agg.perplexity25_GEM-web_nlg_en_PALM_prompt_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.439590405391749, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.03639316276575898}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.11798108343049835, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.004189810027811706}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.282170938801227, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004883544121946002}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.12947090595404617, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002852782352526057}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.05196889371341826, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0025533461681694508}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.13218044825747446, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0032380010251441865}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.05808665518589103, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0017777894288570288}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.10825494458392844, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.003904994298291327}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.2645472840621899, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004556021445746197}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.11858785172635401, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.002478780617084794}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.11031861099356242, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0039604815937864905}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.26713799982719905, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004549761006024966}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.12077915827100709, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002551676685757977}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-2b8-55b-oscar-perplexity/perplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/perplexity25/evaluation/generation/agg.perplexity25_GEM-web_nlg_en_PALM_prompt_2.json b/perplexity25/evaluation/generation/agg.perplexity25_GEM-web_nlg_en_PALM_prompt_2.json new file mode 100644 index 0000000000000000000000000000000000000000..2fa5f6d6aea2e4c70b3eb04a6a705fdbe45e64af --- /dev/null +++ b/perplexity25/evaluation/generation/agg.perplexity25_GEM-web_nlg_en_PALM_prompt_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.4327894307296322, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.024640640059482456}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.12297046315173006, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0040897147406697325}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.3042534732622601, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004903877544018215}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.1410031634689578, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0032324876149143174}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.0576039991584552, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0025535933466243133}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.15077982517511446, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0034374572449847826}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.06752669346406527, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0021138358803451953}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.1104912096950109, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0036047067672774166}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.28546625761473593, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004574662165094106}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.12796808140720628, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0027316442230635152}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.11307661210149669, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.003718228549147224}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.2874301444825106, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.00459624777457841}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.13012460046320815, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002821583895708515}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-2b8-55b-oscar-perplexity/perplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/perplexity25/evaluation/generation/agg.perplexity25_GEM-web_nlg_en_PALM_prompt_3.json b/perplexity25/evaluation/generation/agg.perplexity25_GEM-web_nlg_en_PALM_prompt_3.json new file mode 100644 index 0000000000000000000000000000000000000000..0dbe04aa820454031921abb47cf320ec09f7854e --- /dev/null +++ b/perplexity25/evaluation/generation/agg.perplexity25_GEM-web_nlg_en_PALM_prompt_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.5404686599298022, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.022697653617625668}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.13845802128499135, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0045597656509502645}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.32092040425844226, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.005008296587989612}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.15560884002865294, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0036234626616506445}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.06702437748497692, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0029685771305559}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.1620667235472547, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0036340890774095654}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.07669311585498696, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.002447936846513278}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.12473752815218381, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.004101879009707582}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.2996525326692619, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004604365063870675}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.1408131779527577, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0031033792829699013}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.1278080751942467, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.004213519190229}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.30254217709571163, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0046415976176704355}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.14358670900260256, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0032033835693374485}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-2b8-55b-oscar-perplexity/perplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/perplexity25/evaluation/generation/agg.perplexity25_GEM-web_nlg_en_PALM_prompt_4.json b/perplexity25/evaluation/generation/agg.perplexity25_GEM-web_nlg_en_PALM_prompt_4.json new file mode 100644 index 0000000000000000000000000000000000000000..6f804de1fc4afb7d37153b2e74dc0bc34b8d5589 --- /dev/null +++ b/perplexity25/evaluation/generation/agg.perplexity25_GEM-web_nlg_en_PALM_prompt_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.5742337786019259, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.03878274750055446}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.14086556381172718, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.004428332001204429}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.32551921944528406, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004991227840335665}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.1600235914525449, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0036097572997394753}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.07032835967682173, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.002913207949737097}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.1657469934541477, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0036471777846592795}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.07941872657600588, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0023817203208560513}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.1253787475855925, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.003857417568887736}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.30410641236844715, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004626592417361122}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.1440562866504595, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0030403449385889405}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.12869971530300842, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.003968071565769882}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.3075445892543285, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004678706009218115}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.1472101403273607, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.003138866129665981}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-2b8-55b-oscar-perplexity/perplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/perplexity25/evaluation/generation/agg.perplexity25_GEM-web_nlg_en_PALM_prompt_5.json b/perplexity25/evaluation/generation/agg.perplexity25_GEM-web_nlg_en_PALM_prompt_5.json new file mode 100644 index 0000000000000000000000000000000000000000..986ba5ce0fa36bdcb840be5b4570cec533d40750 --- /dev/null +++ b/perplexity25/evaluation/generation/agg.perplexity25_GEM-web_nlg_en_PALM_prompt_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.635110535837625, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.03871788894965444}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.1525500458853948, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.004620561884453087}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.33136495455869663, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004922267534666466}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.16874449129697527, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.003695736819713046}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.07343448799144045, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.00283017590959593}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.16823943214461987, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.003586567555229492}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.08341646218330169, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.00245206001866393}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.13575531369040605, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0040450583472974805}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.30873860481408066, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004580652118490307}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.15194218033858106, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.003180047227446292}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.13990818551922082, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.004203614112801349}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.31270960518749086, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004631706988744322}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.15546806288792936, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0032849232577235156}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-2b8-55b-oscar-perplexity/perplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/perplexity25/evaluation/generation/agg.perplexity25_GEM-wiki_lingua_en_tldr_en_0.json b/perplexity25/evaluation/generation/agg.perplexity25_GEM-wiki_lingua_en_tldr_en_0.json new file mode 100644 index 0000000000000000000000000000000000000000..d05ef20f7057c3f004aa2bc9b780143d9796469c --- /dev/null +++ b/perplexity25/evaluation/generation/agg.perplexity25_GEM-wiki_lingua_en_tldr_en_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.14065522911885284, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0026167234065659377}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.2077858455356502, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.003207547563015362}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.15054961097467578, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.00226377650907843}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.028936499156918462, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0008308890956254622}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.047621572002057626, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0014677026992242054}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.03284973650336109, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0008901474353695594}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.10891616878029095, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.002128146385613769}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.16364999329689073, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0025474652737291228}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.11606660794433771, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0016651813354424878}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.1297853946244735, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0024785686496660475}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.1912754353743984, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002981659373353225}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.1383437322796597, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002090310705469885}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 1.9837825625170797, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.11075715745007846}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-2b8-55b-oscar-perplexity/perplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/perplexity25/evaluation/generation/agg.perplexity25_GEM-wiki_lingua_en_tldr_en_1.json b/perplexity25/evaluation/generation/agg.perplexity25_GEM-wiki_lingua_en_tldr_en_1.json new file mode 100644 index 0000000000000000000000000000000000000000..9ec74efb03854bc00bd5f46496246d39015d1a1e --- /dev/null +++ b/perplexity25/evaluation/generation/agg.perplexity25_GEM-wiki_lingua_en_tldr_en_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.2762425105029227, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.003910267300588051}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.20834745854239614, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0027380965011137614}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.1947910450168483, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0020869483396049704}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.08055553948421161, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.002606559746437613}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.05150103955877206, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0014183315910517708}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.049392514158574624, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0012208161442090015}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.21851702868734507, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.003372441044700006}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.16057548751118275, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002148069814749071}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.15001937245323257, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0015991824476393945}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.25916065316674775, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0037279536032471168}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.19441611485589055, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0025510292731691516}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.18180570375726848, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.001936138194096433}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 2.731757866860902, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.09401566144028131}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-2b8-55b-oscar-perplexity/perplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/perplexity25/evaluation/generation/agg.perplexity25_GEM-wiki_lingua_en_tldr_en_2.json b/perplexity25/evaluation/generation/agg.perplexity25_GEM-wiki_lingua_en_tldr_en_2.json new file mode 100644 index 0000000000000000000000000000000000000000..10c3e6f5b8149f468ac7330b9d65950a6d9a1984 --- /dev/null +++ b/perplexity25/evaluation/generation/agg.perplexity25_GEM-wiki_lingua_en_tldr_en_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.32626754575036726, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.004160952183668717}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.20383479538093535, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0026993794458441043}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.20613936702027444, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0021190894920928268}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.10007636311761049, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0028550431288296794}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.054415586299804586, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0013915187854267616}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.05603389382170741, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.001271062816942248}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.2635619488392546, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0036380974285539374}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.1603578397536738, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002146919731505488}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.16252489097757244, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0016718094991769424}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.3074344862627562, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.004014028577734544}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.19073199447466943, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002535477745360056}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.1931517785284218, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.001993853381084745}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 2.9322639050220105, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.12143454557270413}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-2b8-55b-oscar-perplexity/perplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/perplexity25/evaluation/generation/agg.perplexity25_GEM-wiki_lingua_en_tldr_en_3.json b/perplexity25/evaluation/generation/agg.perplexity25_GEM-wiki_lingua_en_tldr_en_3.json new file mode 100644 index 0000000000000000000000000000000000000000..4c7a8018e58d2847e3b77c9b3f38365e0c380828 --- /dev/null +++ b/perplexity25/evaluation/generation/agg.perplexity25_GEM-wiki_lingua_en_tldr_en_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.2922725222200554, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.004651782939278748}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.16905603244144393, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002893722815519241}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.17399824491538346, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0024206540471267573}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.09252698046948368, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.002866844020761}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.04722768100471586, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.001416812413385918}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.04907480009549843, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0012971765065339716}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.23838599830741092, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.004037065243320852}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.13345263947824532, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002299889404388408}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.13802926833801735, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0019272093177852146}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.2757198208371055, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.004460275498557492}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.1579566276306941, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0027014936394507074}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.16286062730037856, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.00226402618082299}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 2.012414052522073, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.1192976063075274}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-2b8-55b-oscar-perplexity/perplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/perplexity25/evaluation/generation/agg.perplexity25_GEM-wiki_lingua_en_tldr_en_4.json b/perplexity25/evaluation/generation/agg.perplexity25_GEM-wiki_lingua_en_tldr_en_4.json new file mode 100644 index 0000000000000000000000000000000000000000..9859dd8c60cd89da5bc20483f3fc34ab2537c414 --- /dev/null +++ b/perplexity25/evaluation/generation/agg.perplexity25_GEM-wiki_lingua_en_tldr_en_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.09803780862444332, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0037542079984195773}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.055939650256776254, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002208174292715702}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.057375310609982466, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002066242545550384}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.03142995177369586, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0021038457526255747}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.015365143064306497, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.000979165685417275}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.0160305041705034, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0009438720743795962}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.08097565827758714, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0032427815281044717}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.04471738861035188, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0017641789615113678}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.04608597234875565, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0016726995424030213}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.09182775554453593, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.003564574100593056}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.051912990141086475, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0020473017772187473}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.05329542007268218, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0019209202512399431}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 0.03493647315810699, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.005631810107220299}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-2b8-55b-oscar-perplexity/perplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/perplexity25/evaluation/generation/agg.perplexity25_GEM-wiki_lingua_en_tldr_en_5.json b/perplexity25/evaluation/generation/agg.perplexity25_GEM-wiki_lingua_en_tldr_en_5.json new file mode 100644 index 0000000000000000000000000000000000000000..0243bccad5019e1e76e89e39f197870e4bd0ca48 --- /dev/null +++ b/perplexity25/evaluation/generation/agg.perplexity25_GEM-wiki_lingua_en_tldr_en_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.016993736073454134, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.001788546858364124}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.00900637633671815, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0010107140778820775}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.009395500241536013, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0009500689605104234}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.006211648856695909, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0010267488110128425}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.0026828841173024234, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0004381628666649999}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.002851312099021117, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.00041531186668653793}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.01439613464214093, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.001575501685496224}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.0074140396273133825, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0008325976973129966}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.007773827425357832, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0007949106358400926}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.016125128414415275, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.00172636694363769}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.008465582889960955, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0009496466031975232}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.008833738275831978, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0008974890832248417}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 1.8561305401207938e-16, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 6.947302305993717e-14}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-2b8-55b-oscar-perplexity/perplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/perplexity25/evaluation/generation/agg.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_0.json b/perplexity25/evaluation/generation/agg.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_0.json new file mode 100644 index 0000000000000000000000000000000000000000..e8307a897a538a3c4bc6de5ea09e8a96b8728848 --- /dev/null +++ b/perplexity25/evaluation/generation/agg.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 5.339927044871696, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.08872791568340165}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.2515052662950541, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.004870810614140465}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.3350266606904938, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0035843768019540086}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.2226828217679673, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002249745722118871}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.16308756446343287, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0051770263257276935}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.14336931732901514, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002169181508375878}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.0962466409781981, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0013503218785409525}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.22734045427809546, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.004892427330623474}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.28693034972602244, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002969166803920127}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.19096195261765536, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0018135664975555404}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.23625674969124535, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.004917569426738765}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.30234122307959604, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0033569459426124634}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.20222274630326326, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002112367456590073}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-2b8-55b-oscar-perplexity/perplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/perplexity25/evaluation/generation/agg.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_1.json b/perplexity25/evaluation/generation/agg.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_1.json new file mode 100644 index 0000000000000000000000000000000000000000..86c8afe5f2e2af1493ec2bee44608ef61dc471a4 --- /dev/null +++ b/perplexity25/evaluation/generation/agg.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 10.995645416426365, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.1355301364434119}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.5186991843866234, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.003179740997511602}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.4184117679002587, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0028975710111925493}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.43760763192725927, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002294835733825743}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.2385007362385778, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0024817174189763467}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.19034676067668307, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0020882764951960587}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.19885963206818635, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0019191251133340809}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.37694670026209454, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0027655570482716324}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.30206571148255096, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002359583500618676}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.3161353012742636, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0019606253829224825}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.4227955643807066, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0030366933000180126}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.3403465420378745, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002668047106474485}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.3559670164748496, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.00223874305132682}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-2b8-55b-oscar-perplexity/perplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/perplexity25/evaluation/generation/agg.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_2.json b/perplexity25/evaluation/generation/agg.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_2.json new file mode 100644 index 0000000000000000000000000000000000000000..5d4f10255be4b7a58f9c2ccb707d3ee4ced1ee4c --- /dev/null +++ b/perplexity25/evaluation/generation/agg.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 12.721286940077317, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.19094329154612846}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.5229324602091411, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0031909121835382993}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.4401132076058208, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002805311642371223}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.4535479079186711, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002205157637138293}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.2525772319738568, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.002506980505193317}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.21097394329000255, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002155594256646686}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.21668784494769056, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0019317691466643027}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.3865460480893656, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0027749325148882765}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.3249916440696209, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002413104785614359}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.3345469747204765, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0019950150742453652}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.43548565683836865, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.003060969562227986}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.366407031063428, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0026844596720968987}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.3773720477580653, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0022315833379365027}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-2b8-55b-oscar-perplexity/perplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/perplexity25/evaluation/generation/agg.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_3.json b/perplexity25/evaluation/generation/agg.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_3.json new file mode 100644 index 0000000000000000000000000000000000000000..2d87e6d959c74818d7992035c9b66c6d338717e8 --- /dev/null +++ b/perplexity25/evaluation/generation/agg.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 13.531244841347167, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.14804992137109332}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.5201401768255047, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.003087529662537695}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.4499141314413611, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0027731042114211733}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.4602006690975045, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002202958672501332}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.2537225301220307, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0024510739744713675}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.2184563815633649, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002176238990613196}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.2226349693599192, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.001956593053550091}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.38767169950748886, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.002705530894575463}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.33483483642414963, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0023947056400905062}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.3422005085679842, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.001990890594788978}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.43884036572466234, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.002991792920013415}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.3796460763325496, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002674393195242478}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.38814660645876126, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0022505112996719723}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-2b8-55b-oscar-perplexity/perplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/perplexity25/evaluation/generation/agg.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_4.json b/perplexity25/evaluation/generation/agg.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_4.json new file mode 100644 index 0000000000000000000000000000000000000000..0d3703489ffe91869128929523aef65a40f1d701 --- /dev/null +++ b/perplexity25/evaluation/generation/agg.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 13.144641083132381, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.22425257366332665}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.5172514001918539, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.003026409634009829}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.4404595087274305, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002720085033791889}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.4543948636144128, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.00216936378243014}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.2515805000837444, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0024310452140277675}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.21291756885767313, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002148428865602042}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.21910499180486853, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0019460167284822956}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.3890522315214248, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.002719821689066892}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.33026355455414214, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0023774186515219294}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.3408417131350513, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.002007724984778065}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.43842236175255295, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0029826343953932937}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.3729149211806265, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0026547829705833277}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.38474418787643466, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.00224573532936523}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-2b8-55b-oscar-perplexity/perplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/perplexity25/evaluation/generation/agg.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_5.json b/perplexity25/evaluation/generation/agg.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_5.json new file mode 100644 index 0000000000000000000000000000000000000000..75f5d72d4741a0b1265bfb8e72ca613e026bfe5d --- /dev/null +++ b/perplexity25/evaluation/generation/agg.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 13.123048347593052, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.17809694322426664}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.517549307513542, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0031180867210341256}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.43869061890223154, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0027334989737563755}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.45359810879893614, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0022034543872964845}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.2511077989934143, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0024722315716345553}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.21132059138033674, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0021474197073557645}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.21805791826958687, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.001957141790282348}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.39019517006735716, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0027358415117223725}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.3300349352658418, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0023622100586565727}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.34126459914946794, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.001998609558923375}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.440642917422858, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0030367113114780704}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.37286555921974923, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0026300003525580365}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.3858165011376146, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002254962578090558}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-2b8-55b-oscar-perplexity/perplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/perplexity25/evaluation/generation/agg.perplexity25_gem_xsum_article_DOC_summary_0.json b/perplexity25/evaluation/generation/agg.perplexity25_gem_xsum_article_DOC_summary_0.json new file mode 100644 index 0000000000000000000000000000000000000000..a0c43f39c2d057325a229efcaec004ae3fe897b2 --- /dev/null +++ b/perplexity25/evaluation/generation/agg.perplexity25_gem_xsum_article_DOC_summary_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.14334820197523107, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.002033372138397688}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.32917310914311515, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.00467334236894172}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.1960206774900659, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002686535722689693}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.02974498876833475, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.001087723908396391}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.0728412590146272, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002755255015054753}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.04154197887366649, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0015125985867695552}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.10507181677422107, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.00149225380203505}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.2427717881723433, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0035988198386666427}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.14378872849238444, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.00198471645496706}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.11365988678450253, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.001665887050045974}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.26338940410019074, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.00403257453510768}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.15577151588810306, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0022348391906834657}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 1.6687565914580829, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.127910501427115}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-2b8-55b-oscar-perplexity/perplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/perplexity25/evaluation/generation/agg.perplexity25_gem_xsum_article_DOC_summary_1.json b/perplexity25/evaluation/generation/agg.perplexity25_gem_xsum_article_DOC_summary_1.json new file mode 100644 index 0000000000000000000000000000000000000000..a9641ed3b8eda55a7492795cda9c7b7fa1c06641 --- /dev/null +++ b/perplexity25/evaluation/generation/agg.perplexity25_gem_xsum_article_DOC_summary_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.21207140626368803, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0038581645356119865}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.27188028017390564, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004158828718436913}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.21898919375507106, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.003161974309035466}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.04596243788195225, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.002111260719585874}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.05792023485426218, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002400639714883728}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.04653779891739668, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0019224898943420372}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.1600433060616687, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.003027321129900961}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.206195928854708, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0032318040465927613}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.16526315756844007, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.00245003920287852}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.1624501288831014, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0030603591196422925}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.21143709654945458, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.003493647295925758}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.16845087952441407, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002544682388183729}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 2.062682455534545, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.1911179218893297}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-2b8-55b-oscar-perplexity/perplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/perplexity25/evaluation/generation/agg.perplexity25_gem_xsum_article_DOC_summary_2.json b/perplexity25/evaluation/generation/agg.perplexity25_gem_xsum_article_DOC_summary_2.json new file mode 100644 index 0000000000000000000000000000000000000000..eacbf9bbd309a16018c2cef87c6f1436015471f8 --- /dev/null +++ b/perplexity25/evaluation/generation/agg.perplexity25_gem_xsum_article_DOC_summary_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.23355885586659017, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0040933932598317116}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.2385966987781216, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.003652888212561435}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.22247490608623707, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.00332374416018175}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.05016034446830836, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0024329093612370433}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.047696834799867076, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002112922260797895}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.04588995604221001, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0020485785234755694}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.17902471101461237, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.003278248895415527}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.18313099716581613, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002898250408281982}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.17047566362303207, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.002652593386481074}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.18054581744258855, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0032824682399233847}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.18603681066581088, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0030547982184099508}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.17233290863534617, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0026846916387991055}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 2.2377052996018123, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.18315337554830305}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-2b8-55b-oscar-perplexity/perplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/perplexity25/evaluation/generation/agg.perplexity25_gem_xsum_article_DOC_summary_3.json b/perplexity25/evaluation/generation/agg.perplexity25_gem_xsum_article_DOC_summary_3.json new file mode 100644 index 0000000000000000000000000000000000000000..4188d2ee7d87c781d7e3c4f6e07461c600699d2c --- /dev/null +++ b/perplexity25/evaluation/generation/agg.perplexity25_gem_xsum_article_DOC_summary_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.22480297343691372, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.004297306487708201}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.21981907620088453, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0039007807029761052}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.211112685269218, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0036478084958463525}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.0473989148356509, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0023542959081873415}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.044786508086352, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0021615066754731775}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.04371921591233377, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.002063160703719779}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.17077143836517153, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0034539784947908905}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.1674256007148668, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.003116778223085841}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.16033960912306436, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0029061742252523438}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.1712430274478181, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0034669992286994146}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.16828003357354404, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0031669163990762543}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.16090737151266438, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0029284586568929447}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 2.4537857681806354, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.23835395567516868}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-2b8-55b-oscar-perplexity/perplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/perplexity25/evaluation/generation/agg.perplexity25_gem_xsum_article_DOC_summary_4.json b/perplexity25/evaluation/generation/agg.perplexity25_gem_xsum_article_DOC_summary_4.json new file mode 100644 index 0000000000000000000000000000000000000000..b4ac7196a830f0b6fd39c72688da310d5d762149 --- /dev/null +++ b/perplexity25/evaluation/generation/agg.perplexity25_gem_xsum_article_DOC_summary_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.06628555493620722, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.004121834877690951}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.05298448052806384, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0032156118972841035}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.053717624136713174, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.003166748644311415}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.013816123034397583, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0015174056131048437}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.011050060864432654, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0011409900901498005}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.01137342409219753, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0011652172138052154}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.05250005230639445, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.003454023255202736}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.04113648447989776, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002572146944390479}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.04172792112777844, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.002524762753775506}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.05270496397071321, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0034548599492127143}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.04137383186582083, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0025707709423569134}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.04194082850704681, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0025260321014198834}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 0.07986347109541274, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.0177976863312144}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-2b8-55b-oscar-perplexity/perplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/perplexity25/evaluation/generation/agg.perplexity25_gem_xsum_article_DOC_summary_5.json b/perplexity25/evaluation/generation/agg.perplexity25_gem_xsum_article_DOC_summary_5.json new file mode 100644 index 0000000000000000000000000000000000000000..f3d4a24e821b82cbf7ab03f2b384c1a988cfd042 --- /dev/null +++ b/perplexity25/evaluation/generation/agg.perplexity25_gem_xsum_article_DOC_summary_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.0008576329331046312, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0008576329331046343}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 4.2881646655231564e-05, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 4.288164665523099e-05}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 8.167932696234583e-05, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 8.167932696234837e-05}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.0, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.0, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.0, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.0008576329331046312, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0008576329331046343}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 4.2881646655231564e-05, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 4.288164665523099e-05}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 8.167932696234583e-05, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 8.167932696234837e-05}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.0008576329331046312, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0008576329331046343}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 4.2881646655231564e-05, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 4.288164665523099e-05}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 8.167932696234583e-05, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 8.167932696234837e-05}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 0.0, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.0}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-2b8-55b-oscar-perplexity/perplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/perplexity25/evaluation/generation/examples.perplexity25_GEM-web_nlg_en_PALM_prompt_0.jsonl b/perplexity25/evaluation/generation/examples.perplexity25_GEM-web_nlg_en_PALM_prompt_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..67224c8742b3b109e26508306fa874d0b21189ee --- /dev/null +++ b/perplexity25/evaluation/generation/examples.perplexity25_GEM-web_nlg_en_PALM_prompt_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:822ad3f74e0175bec275b1ff62e5e218dbc48824602df00e7b080948f79d7ce5 +size 4116577 diff --git a/perplexity25/evaluation/generation/examples.perplexity25_GEM-web_nlg_en_PALM_prompt_1.jsonl b/perplexity25/evaluation/generation/examples.perplexity25_GEM-web_nlg_en_PALM_prompt_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..87d2ff0ed5722c73ee825a8b5d81bab9329438f1 --- /dev/null +++ b/perplexity25/evaluation/generation/examples.perplexity25_GEM-web_nlg_en_PALM_prompt_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb6764c9d8e6e92516839b17b60ed38f073d8b29db8dfbb3cc557e983bf6d054 +size 4743197 diff --git a/perplexity25/evaluation/generation/examples.perplexity25_GEM-web_nlg_en_PALM_prompt_2.jsonl b/perplexity25/evaluation/generation/examples.perplexity25_GEM-web_nlg_en_PALM_prompt_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..7e61710e7a5285d48edfd766b30098fdc0d3450b --- /dev/null +++ b/perplexity25/evaluation/generation/examples.perplexity25_GEM-web_nlg_en_PALM_prompt_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ddf0e54dfa2f50631318b031d3c569010511709e3a2ef16bbb75fa7b9bb8a0c6 +size 5688480 diff --git a/perplexity25/evaluation/generation/examples.perplexity25_GEM-web_nlg_en_PALM_prompt_3.jsonl b/perplexity25/evaluation/generation/examples.perplexity25_GEM-web_nlg_en_PALM_prompt_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..c8bba2210a946c0fe29b9a5cc26b601c020abb9f --- /dev/null +++ b/perplexity25/evaluation/generation/examples.perplexity25_GEM-web_nlg_en_PALM_prompt_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e44fc56fbd1f3a533d7e72e1363db0b4ecce81f1c8d1ab0e0cf52549221152a0 +size 6584294 diff --git a/perplexity25/evaluation/generation/examples.perplexity25_GEM-web_nlg_en_PALM_prompt_4.jsonl b/perplexity25/evaluation/generation/examples.perplexity25_GEM-web_nlg_en_PALM_prompt_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..4a6a937a99a5b4515721e52f0fbea8faaa7b571a --- /dev/null +++ b/perplexity25/evaluation/generation/examples.perplexity25_GEM-web_nlg_en_PALM_prompt_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:09e32bf9fc5fbc72594e3474a93a96e1ff87d661f40cbb8f22d515736450a2fa +size 7463401 diff --git a/perplexity25/evaluation/generation/examples.perplexity25_GEM-web_nlg_en_PALM_prompt_5.jsonl b/perplexity25/evaluation/generation/examples.perplexity25_GEM-web_nlg_en_PALM_prompt_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..61faf3db14a42beecf7c9d1f74e651b0e5696bd4 --- /dev/null +++ b/perplexity25/evaluation/generation/examples.perplexity25_GEM-web_nlg_en_PALM_prompt_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34134578187633f9cba98670499c4c03acf39e57d1227d7e27b2a2ce33e36fb1 +size 8342477 diff --git a/perplexity25/evaluation/generation/examples.perplexity25_GEM-wiki_lingua_en_tldr_en_0.jsonl b/perplexity25/evaluation/generation/examples.perplexity25_GEM-wiki_lingua_en_tldr_en_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..323daf01cd2a4bef717340c4d3560132c150b060 --- /dev/null +++ b/perplexity25/evaluation/generation/examples.perplexity25_GEM-wiki_lingua_en_tldr_en_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b0fcd28269b4ac56f41923c7503d52070ac78938aae7fdb7a49050cff780c5a +size 7497261 diff --git a/perplexity25/evaluation/generation/examples.perplexity25_GEM-wiki_lingua_en_tldr_en_1.jsonl b/perplexity25/evaluation/generation/examples.perplexity25_GEM-wiki_lingua_en_tldr_en_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..c8453fa73250d420f1a86764388fd04331467d6e --- /dev/null +++ b/perplexity25/evaluation/generation/examples.perplexity25_GEM-wiki_lingua_en_tldr_en_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:560805bffb111d753be13678d4be2cb35ae26fc8f09de249b0d5b83a2f69b673 +size 12965254 diff --git a/perplexity25/evaluation/generation/examples.perplexity25_GEM-wiki_lingua_en_tldr_en_2.jsonl b/perplexity25/evaluation/generation/examples.perplexity25_GEM-wiki_lingua_en_tldr_en_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..ea64a998302a985a592fff17b7e0192cef831729 --- /dev/null +++ b/perplexity25/evaluation/generation/examples.perplexity25_GEM-wiki_lingua_en_tldr_en_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:59f6c7ddebc47dce22241a79dc34d620fbbed5ffe0ba77f3325f41d56866733a +size 18491446 diff --git a/perplexity25/evaluation/generation/examples.perplexity25_GEM-wiki_lingua_en_tldr_en_3.jsonl b/perplexity25/evaluation/generation/examples.perplexity25_GEM-wiki_lingua_en_tldr_en_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..1e258da6f8540502f54dc6ebf0871e1e5f5d9163 --- /dev/null +++ b/perplexity25/evaluation/generation/examples.perplexity25_GEM-wiki_lingua_en_tldr_en_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b0f806d48de7e5c6903dee254acb740440974a312d32df7dec8e88f5fc08a2c4 +size 23973466 diff --git a/perplexity25/evaluation/generation/examples.perplexity25_GEM-wiki_lingua_en_tldr_en_4.jsonl b/perplexity25/evaluation/generation/examples.perplexity25_GEM-wiki_lingua_en_tldr_en_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..bba2e07981b4c5be60b36c8d6743329a1d182ba3 --- /dev/null +++ b/perplexity25/evaluation/generation/examples.perplexity25_GEM-wiki_lingua_en_tldr_en_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:666bf3b6d1839589ce3587b865eb9ae48268705d3b7db8f0f05e9cdb22ca0018 +size 29357477 diff --git a/perplexity25/evaluation/generation/examples.perplexity25_GEM-wiki_lingua_en_tldr_en_5.jsonl b/perplexity25/evaluation/generation/examples.perplexity25_GEM-wiki_lingua_en_tldr_en_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..4cbc4f57880381eedea1e79d5b748aa4fd0cfdc7 --- /dev/null +++ b/perplexity25/evaluation/generation/examples.perplexity25_GEM-wiki_lingua_en_tldr_en_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f770885124179ee129bd4e77a83015cd87d23126b4ee5c517c1c8abd2ce0c401 +size 34781244 diff --git a/perplexity25/evaluation/generation/examples.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl b/perplexity25/evaluation/generation/examples.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..0918c7756f5d88a405ebf6db7f1fef403495088a --- /dev/null +++ b/perplexity25/evaluation/generation/examples.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df449942c907500be636599ed22ac295fcb2c0f9dab147917bd789bf1f45b26f +size 4292925 diff --git a/perplexity25/evaluation/generation/examples.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl b/perplexity25/evaluation/generation/examples.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..976c2cad865821c68167c2d60aed4d9a25b61ac2 --- /dev/null +++ b/perplexity25/evaluation/generation/examples.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a42389d7c695170b293218ff9043112d9ef5895daa4cab280c4a2731a9d087b +size 5023162 diff --git a/perplexity25/evaluation/generation/examples.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl b/perplexity25/evaluation/generation/examples.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..287928cb001a0893536bf707aaec120d8c04c1d3 --- /dev/null +++ b/perplexity25/evaluation/generation/examples.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c09811728119b3f3eaa6108c402dadc508a59dc3cdb8e68be8468947fce4938b +size 6118598 diff --git a/perplexity25/evaluation/generation/examples.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl b/perplexity25/evaluation/generation/examples.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..eea464bf903605e3ad0e8cb5ba33d0cfd4e585c8 --- /dev/null +++ b/perplexity25/evaluation/generation/examples.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb3151eebf9c91836bba24b5a49af3fec6d7ff70c107e215a2619a04c5830e88 +size 7204798 diff --git a/perplexity25/evaluation/generation/examples.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl b/perplexity25/evaluation/generation/examples.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..c2becc2260ff3e1dbaa1fc1a66f8ead41a598d6f --- /dev/null +++ b/perplexity25/evaluation/generation/examples.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c171c1c67513ec972cd3a674881b35f3030357ec5c1851cb5af8fd7f6305226 +size 8274656 diff --git a/perplexity25/evaluation/generation/examples.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl b/perplexity25/evaluation/generation/examples.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..a831ece93581209096350117ca1beff68b733d73 --- /dev/null +++ b/perplexity25/evaluation/generation/examples.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:433b2191a17e274847f2ab4cb5c96fcd32d828243f7ec5b1f9b6b621de7ae4ff +size 9359659 diff --git a/perplexity25/evaluation/generation/examples.perplexity25_gem_xsum_article_DOC_summary_0.jsonl b/perplexity25/evaluation/generation/examples.perplexity25_gem_xsum_article_DOC_summary_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..cf51970397edc701c99e10095ef0089c93befc2c --- /dev/null +++ b/perplexity25/evaluation/generation/examples.perplexity25_gem_xsum_article_DOC_summary_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e29cdba3357771939829ae254498d46b925e427508fbd2a771af872c69894c8a +size 2822430 diff --git a/perplexity25/evaluation/generation/examples.perplexity25_gem_xsum_article_DOC_summary_1.jsonl b/perplexity25/evaluation/generation/examples.perplexity25_gem_xsum_article_DOC_summary_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..bc60732255d49e2c5a9154a898f5cb835f9228f5 --- /dev/null +++ b/perplexity25/evaluation/generation/examples.perplexity25_gem_xsum_article_DOC_summary_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce33d1a49965fd2568b13c7a0c9d63966b51a0565eada576840de5041c4dca74 +size 4970026 diff --git a/perplexity25/evaluation/generation/examples.perplexity25_gem_xsum_article_DOC_summary_2.jsonl b/perplexity25/evaluation/generation/examples.perplexity25_gem_xsum_article_DOC_summary_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..475f2bc697265f413fe62f0c35d66d7f59a08869 --- /dev/null +++ b/perplexity25/evaluation/generation/examples.perplexity25_gem_xsum_article_DOC_summary_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d26a92d135b644879a58d87b302a2afe1931fb5be1f2ba66ba90734a07ca6b88 +size 7195169 diff --git a/perplexity25/evaluation/generation/examples.perplexity25_gem_xsum_article_DOC_summary_3.jsonl b/perplexity25/evaluation/generation/examples.perplexity25_gem_xsum_article_DOC_summary_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..429533f2e04f08dabdfc203055fd3c572b90e8ad --- /dev/null +++ b/perplexity25/evaluation/generation/examples.perplexity25_gem_xsum_article_DOC_summary_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b09b0dc61f8dc807cb10b0edacdcc4ff99884106d73aa1cf7d139103ac571c73 +size 9465771 diff --git a/perplexity25/evaluation/generation/examples.perplexity25_gem_xsum_article_DOC_summary_4.jsonl b/perplexity25/evaluation/generation/examples.perplexity25_gem_xsum_article_DOC_summary_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..4e47e36539b5963c575c1e37be88877362b7d4dc --- /dev/null +++ b/perplexity25/evaluation/generation/examples.perplexity25_gem_xsum_article_DOC_summary_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e04284564213478747c8786c2499ac0c6894dbb578852bf16ccb02382554924 +size 11628177 diff --git a/perplexity25/evaluation/generation/examples.perplexity25_gem_xsum_article_DOC_summary_5.jsonl b/perplexity25/evaluation/generation/examples.perplexity25_gem_xsum_article_DOC_summary_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..f4764f96e576ed0222e9845f0582c60e254ecf7f --- /dev/null +++ b/perplexity25/evaluation/generation/examples.perplexity25_gem_xsum_article_DOC_summary_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08441f44b7726f7d8cb8f98df1e8d6ae6adcf91b66eaaff9b981508b523fa077 +size 13896053 diff --git a/perplexity25/evaluation/generation/slim.perplexity25_GEM-web_nlg_en_PALM_prompt_0.json b/perplexity25/evaluation/generation/slim.perplexity25_GEM-web_nlg_en_PALM_prompt_0.json new file mode 100644 index 0000000000000000000000000000000000000000..7ec9230fd06a9f908f5b5560ccbe8e532c6fc790 --- /dev/null +++ b/perplexity25/evaluation/generation/slim.perplexity25_GEM-web_nlg_en_PALM_prompt_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.35947270396511505, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.03976947372157981 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.07545439815870926, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0022680323540535106 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.3521835615440358, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.00619686620162303 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.10839552028832326, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0021723652033459194 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.032699451519105735, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.001384275605757562 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.15406776335401268, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.003465085716143713 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.047276019716226934, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0012856377731630094 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.07039855492701995, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0020974056683073722 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.3340045099502354, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.005873382118908422 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.10130202856745985, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0019472676322570249 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.07004936083081541, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.002133247465940297 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.3244285334323993, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.005600594696630026 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.10030698310345207, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.00199704924468202 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-2b8-55b-oscar-perplexity/perplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/perplexity25/evaluation/generation/slim.perplexity25_GEM-web_nlg_en_PALM_prompt_1.json b/perplexity25/evaluation/generation/slim.perplexity25_GEM-web_nlg_en_PALM_prompt_1.json new file mode 100644 index 0000000000000000000000000000000000000000..38bdc504655d65b3112aa4d0a571bde414e05920 --- /dev/null +++ b/perplexity25/evaluation/generation/slim.perplexity25_GEM-web_nlg_en_PALM_prompt_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.439590405391749, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.03639316276575898 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.11798108343049835, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.004189810027811706 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.282170938801227, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.004883544121946002 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.12947090595404617, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.002852782352526057 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.05196889371341826, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0025533461681694508 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.13218044825747446, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0032380010251441865 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.05808665518589103, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0017777894288570288 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.10825494458392844, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.003904994298291327 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.2645472840621899, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004556021445746197 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.11858785172635401, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.002478780617084794 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.11031861099356242, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0039604815937864905 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.26713799982719905, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004549761006024966 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.12077915827100709, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.002551676685757977 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-2b8-55b-oscar-perplexity/perplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/perplexity25/evaluation/generation/slim.perplexity25_GEM-web_nlg_en_PALM_prompt_2.json b/perplexity25/evaluation/generation/slim.perplexity25_GEM-web_nlg_en_PALM_prompt_2.json new file mode 100644 index 0000000000000000000000000000000000000000..3f2b5f689da3213275777792fa9af39e6fef1509 --- /dev/null +++ b/perplexity25/evaluation/generation/slim.perplexity25_GEM-web_nlg_en_PALM_prompt_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.4327894307296322, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.024640640059482456 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.12297046315173006, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0040897147406697325 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.3042534732622601, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.004903877544018215 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.1410031634689578, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0032324876149143174 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.0576039991584552, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0025535933466243133 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.15077982517511446, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0034374572449847826 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.06752669346406527, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0021138358803451953 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.1104912096950109, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0036047067672774166 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.28546625761473593, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004574662165094106 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.12796808140720628, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0027316442230635152 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.11307661210149669, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.003718228549147224 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.2874301444825106, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.00459624777457841 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.13012460046320815, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.002821583895708515 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-2b8-55b-oscar-perplexity/perplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/perplexity25/evaluation/generation/slim.perplexity25_GEM-web_nlg_en_PALM_prompt_3.json b/perplexity25/evaluation/generation/slim.perplexity25_GEM-web_nlg_en_PALM_prompt_3.json new file mode 100644 index 0000000000000000000000000000000000000000..7f0ff21d178326af441d840cc080639e6c29d70e --- /dev/null +++ b/perplexity25/evaluation/generation/slim.perplexity25_GEM-web_nlg_en_PALM_prompt_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.5404686599298022, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.022697653617625668 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.13845802128499135, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0045597656509502645 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.32092040425844226, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.005008296587989612 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.15560884002865294, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0036234626616506445 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.06702437748497692, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0029685771305559 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.1620667235472547, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0036340890774095654 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.07669311585498696, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.002447936846513278 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.12473752815218381, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.004101879009707582 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.2996525326692619, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004604365063870675 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.1408131779527577, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0031033792829699013 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.1278080751942467, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.004213519190229 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.30254217709571163, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0046415976176704355 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.14358670900260256, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0032033835693374485 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-2b8-55b-oscar-perplexity/perplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/perplexity25/evaluation/generation/slim.perplexity25_GEM-web_nlg_en_PALM_prompt_4.json b/perplexity25/evaluation/generation/slim.perplexity25_GEM-web_nlg_en_PALM_prompt_4.json new file mode 100644 index 0000000000000000000000000000000000000000..eb151016e32ad35cff6f879aac9d4cf3bc43870a --- /dev/null +++ b/perplexity25/evaluation/generation/slim.perplexity25_GEM-web_nlg_en_PALM_prompt_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.5742337786019259, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.03878274750055446 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.14086556381172718, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.004428332001204429 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.32551921944528406, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.004991227840335665 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.1600235914525449, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0036097572997394753 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.07032835967682173, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.002913207949737097 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.1657469934541477, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0036471777846592795 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.07941872657600588, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0023817203208560513 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.1253787475855925, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.003857417568887736 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.30410641236844715, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004626592417361122 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.1440562866504595, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0030403449385889405 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.12869971530300842, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.003968071565769882 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.3075445892543285, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004678706009218115 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.1472101403273607, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.003138866129665981 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-2b8-55b-oscar-perplexity/perplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/perplexity25/evaluation/generation/slim.perplexity25_GEM-web_nlg_en_PALM_prompt_5.json b/perplexity25/evaluation/generation/slim.perplexity25_GEM-web_nlg_en_PALM_prompt_5.json new file mode 100644 index 0000000000000000000000000000000000000000..dc100cc73e5c239878acf665a3d94a825800c98e --- /dev/null +++ b/perplexity25/evaluation/generation/slim.perplexity25_GEM-web_nlg_en_PALM_prompt_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.635110535837625, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.03871788894965444 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.1525500458853948, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.004620561884453087 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.33136495455869663, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.004922267534666466 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.16874449129697527, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.003695736819713046 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.07343448799144045, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.00283017590959593 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.16823943214461987, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.003586567555229492 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.08341646218330169, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.00245206001866393 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.13575531369040605, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0040450583472974805 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.30873860481408066, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004580652118490307 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.15194218033858106, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.003180047227446292 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.13990818551922082, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.004203614112801349 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.31270960518749086, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004631706988744322 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.15546806288792936, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0032849232577235156 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-2b8-55b-oscar-perplexity/perplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/perplexity25/evaluation/generation/slim.perplexity25_GEM-wiki_lingua_en_tldr_en_0.json b/perplexity25/evaluation/generation/slim.perplexity25_GEM-wiki_lingua_en_tldr_en_0.json new file mode 100644 index 0000000000000000000000000000000000000000..4dcae16d11bd27e1a9472d5b0fd0f9572fd80737 --- /dev/null +++ b/perplexity25/evaluation/generation/slim.perplexity25_GEM-wiki_lingua_en_tldr_en_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.14065522911885284, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0026167234065659377 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.2077858455356502, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.003207547563015362 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.15054961097467578, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.00226377650907843 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.028936499156918462, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0008308890956254622 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.047621572002057626, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0014677026992242054 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.03284973650336109, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0008901474353695594 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.10891616878029095, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.002128146385613769 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.16364999329689073, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0025474652737291228 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.11606660794433771, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0016651813354424878 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.1297853946244735, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0024785686496660475 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.1912754353743984, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.002981659373353225 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.1383437322796597, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.002090310705469885 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 1.9837825625170797, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.11075715745007846 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-2b8-55b-oscar-perplexity/perplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/perplexity25/evaluation/generation/slim.perplexity25_GEM-wiki_lingua_en_tldr_en_1.json b/perplexity25/evaluation/generation/slim.perplexity25_GEM-wiki_lingua_en_tldr_en_1.json new file mode 100644 index 0000000000000000000000000000000000000000..0a9d6334ade9e369c3ca31475c37672bcd171409 --- /dev/null +++ b/perplexity25/evaluation/generation/slim.perplexity25_GEM-wiki_lingua_en_tldr_en_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.2762425105029227, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.003910267300588051 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.20834745854239614, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0027380965011137614 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.1947910450168483, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0020869483396049704 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.08055553948421161, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.002606559746437613 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.05150103955877206, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0014183315910517708 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.049392514158574624, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0012208161442090015 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.21851702868734507, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.003372441044700006 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.16057548751118275, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.002148069814749071 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.15001937245323257, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0015991824476393945 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.25916065316674775, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0037279536032471168 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.19441611485589055, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0025510292731691516 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.18180570375726848, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.001936138194096433 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 2.731757866860902, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.09401566144028131 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-2b8-55b-oscar-perplexity/perplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/perplexity25/evaluation/generation/slim.perplexity25_GEM-wiki_lingua_en_tldr_en_2.json b/perplexity25/evaluation/generation/slim.perplexity25_GEM-wiki_lingua_en_tldr_en_2.json new file mode 100644 index 0000000000000000000000000000000000000000..6b58a69f40f320d226d6e82d96fe40ef0162e414 --- /dev/null +++ b/perplexity25/evaluation/generation/slim.perplexity25_GEM-wiki_lingua_en_tldr_en_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.32626754575036726, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.004160952183668717 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.20383479538093535, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0026993794458441043 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.20613936702027444, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0021190894920928268 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.10007636311761049, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0028550431288296794 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.054415586299804586, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0013915187854267616 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.05603389382170741, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.001271062816942248 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.2635619488392546, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0036380974285539374 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.1603578397536738, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.002146919731505488 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.16252489097757244, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0016718094991769424 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.3074344862627562, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.004014028577734544 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.19073199447466943, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.002535477745360056 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.1931517785284218, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.001993853381084745 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 2.9322639050220105, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.12143454557270413 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-2b8-55b-oscar-perplexity/perplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/perplexity25/evaluation/generation/slim.perplexity25_GEM-wiki_lingua_en_tldr_en_3.json b/perplexity25/evaluation/generation/slim.perplexity25_GEM-wiki_lingua_en_tldr_en_3.json new file mode 100644 index 0000000000000000000000000000000000000000..8889e6c0ca30bf55007cf0a1d6696fa472a283dd --- /dev/null +++ b/perplexity25/evaluation/generation/slim.perplexity25_GEM-wiki_lingua_en_tldr_en_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.2922725222200554, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.004651782939278748 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.16905603244144393, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.002893722815519241 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.17399824491538346, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0024206540471267573 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.09252698046948368, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.002866844020761 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.04722768100471586, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.001416812413385918 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.04907480009549843, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0012971765065339716 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.23838599830741092, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.004037065243320852 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.13345263947824532, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.002299889404388408 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.13802926833801735, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0019272093177852146 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.2757198208371055, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.004460275498557492 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.1579566276306941, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0027014936394507074 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.16286062730037856, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.00226402618082299 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 2.012414052522073, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.1192976063075274 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-2b8-55b-oscar-perplexity/perplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/perplexity25/evaluation/generation/slim.perplexity25_GEM-wiki_lingua_en_tldr_en_4.json b/perplexity25/evaluation/generation/slim.perplexity25_GEM-wiki_lingua_en_tldr_en_4.json new file mode 100644 index 0000000000000000000000000000000000000000..0567615da37a66d37615a2546b6e4282de9d6f0b --- /dev/null +++ b/perplexity25/evaluation/generation/slim.perplexity25_GEM-wiki_lingua_en_tldr_en_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.09803780862444332, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0037542079984195773 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.055939650256776254, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.002208174292715702 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.057375310609982466, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.002066242545550384 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.03142995177369586, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0021038457526255747 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.015365143064306497, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.000979165685417275 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.0160305041705034, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0009438720743795962 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.08097565827758714, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0032427815281044717 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.04471738861035188, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0017641789615113678 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.04608597234875565, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0016726995424030213 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.09182775554453593, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.003564574100593056 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.051912990141086475, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0020473017772187473 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.05329542007268218, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0019209202512399431 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 0.03493647315810699, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.005631810107220299 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-2b8-55b-oscar-perplexity/perplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/perplexity25/evaluation/generation/slim.perplexity25_GEM-wiki_lingua_en_tldr_en_5.json b/perplexity25/evaluation/generation/slim.perplexity25_GEM-wiki_lingua_en_tldr_en_5.json new file mode 100644 index 0000000000000000000000000000000000000000..d599a45632596bf619e84832103507ffa1f44e71 --- /dev/null +++ b/perplexity25/evaluation/generation/slim.perplexity25_GEM-wiki_lingua_en_tldr_en_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.016993736073454134, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.001788546858364124 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.00900637633671815, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0010107140778820775 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.009395500241536013, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0009500689605104234 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.006211648856695909, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0010267488110128425 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.0026828841173024234, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0004381628666649999 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.002851312099021117, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.00041531186668653793 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.01439613464214093, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.001575501685496224 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.0074140396273133825, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0008325976973129966 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.007773827425357832, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0007949106358400926 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.016125128414415275, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.00172636694363769 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.008465582889960955, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0009496466031975232 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.008833738275831978, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0008974890832248417 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 1.8561305401207938e-16, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 6.947302305993717e-14 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-2b8-55b-oscar-perplexity/perplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/perplexity25/evaluation/generation/slim.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_0.json b/perplexity25/evaluation/generation/slim.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_0.json new file mode 100644 index 0000000000000000000000000000000000000000..406bb09067b4eea9f03252c4cd3ee19b75b6e5b0 --- /dev/null +++ b/perplexity25/evaluation/generation/slim.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 5.339927044871696, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.08872791568340165 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.2515052662950541, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.004870810614140465 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.3350266606904938, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0035843768019540086 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.2226828217679673, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.002249745722118871 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.16308756446343287, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0051770263257276935 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.14336931732901514, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.002169181508375878 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.0962466409781981, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0013503218785409525 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.22734045427809546, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.004892427330623474 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.28693034972602244, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.002969166803920127 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.19096195261765536, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0018135664975555404 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.23625674969124535, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.004917569426738765 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.30234122307959604, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0033569459426124634 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.20222274630326326, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.002112367456590073 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-2b8-55b-oscar-perplexity/perplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/perplexity25/evaluation/generation/slim.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_1.json b/perplexity25/evaluation/generation/slim.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_1.json new file mode 100644 index 0000000000000000000000000000000000000000..24ead5fae35134a5b7125cfde8ad517fb23aa305 --- /dev/null +++ b/perplexity25/evaluation/generation/slim.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 10.995645416426365, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.1355301364434119 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.5186991843866234, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.003179740997511602 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.4184117679002587, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0028975710111925493 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.43760763192725927, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.002294835733825743 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.2385007362385778, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0024817174189763467 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.19034676067668307, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0020882764951960587 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.19885963206818635, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0019191251133340809 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.37694670026209454, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0027655570482716324 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.30206571148255096, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.002359583500618676 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.3161353012742636, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0019606253829224825 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.4227955643807066, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0030366933000180126 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.3403465420378745, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.002668047106474485 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.3559670164748496, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.00223874305132682 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-2b8-55b-oscar-perplexity/perplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/perplexity25/evaluation/generation/slim.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_2.json b/perplexity25/evaluation/generation/slim.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_2.json new file mode 100644 index 0000000000000000000000000000000000000000..e83c1d0dbbc09bd09f0ac5ed4d2c901693af3d01 --- /dev/null +++ b/perplexity25/evaluation/generation/slim.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 12.721286940077317, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.19094329154612846 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.5229324602091411, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0031909121835382993 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.4401132076058208, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.002805311642371223 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.4535479079186711, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.002205157637138293 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.2525772319738568, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.002506980505193317 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.21097394329000255, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.002155594256646686 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.21668784494769056, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0019317691466643027 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.3865460480893656, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0027749325148882765 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.3249916440696209, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.002413104785614359 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.3345469747204765, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0019950150742453652 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.43548565683836865, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.003060969562227986 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.366407031063428, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0026844596720968987 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.3773720477580653, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0022315833379365027 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-2b8-55b-oscar-perplexity/perplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/perplexity25/evaluation/generation/slim.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_3.json b/perplexity25/evaluation/generation/slim.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_3.json new file mode 100644 index 0000000000000000000000000000000000000000..2a204940d712985caf583fcf35c4d61354e17c62 --- /dev/null +++ b/perplexity25/evaluation/generation/slim.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 13.531244841347167, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.14804992137109332 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.5201401768255047, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.003087529662537695 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.4499141314413611, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0027731042114211733 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.4602006690975045, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.002202958672501332 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.2537225301220307, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0024510739744713675 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.2184563815633649, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.002176238990613196 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.2226349693599192, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.001956593053550091 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.38767169950748886, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.002705530894575463 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.33483483642414963, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0023947056400905062 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.3422005085679842, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.001990890594788978 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.43884036572466234, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.002991792920013415 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.3796460763325496, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.002674393195242478 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.38814660645876126, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0022505112996719723 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-2b8-55b-oscar-perplexity/perplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/perplexity25/evaluation/generation/slim.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_4.json b/perplexity25/evaluation/generation/slim.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_4.json new file mode 100644 index 0000000000000000000000000000000000000000..2f72e40cf44dca87c8debcfd39a364905682ee2d --- /dev/null +++ b/perplexity25/evaluation/generation/slim.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 13.144641083132381, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.22425257366332665 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.5172514001918539, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.003026409634009829 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.4404595087274305, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.002720085033791889 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.4543948636144128, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.00216936378243014 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.2515805000837444, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0024310452140277675 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.21291756885767313, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.002148428865602042 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.21910499180486853, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0019460167284822956 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.3890522315214248, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.002719821689066892 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.33026355455414214, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0023774186515219294 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.3408417131350513, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.002007724984778065 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.43842236175255295, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0029826343953932937 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.3729149211806265, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0026547829705833277 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.38474418787643466, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.00224573532936523 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-2b8-55b-oscar-perplexity/perplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/perplexity25/evaluation/generation/slim.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_5.json b/perplexity25/evaluation/generation/slim.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_5.json new file mode 100644 index 0000000000000000000000000000000000000000..ce2be28e53fa7b57f6882b4327abd611f9e37bd5 --- /dev/null +++ b/perplexity25/evaluation/generation/slim.perplexity25_e2e_nlg_cleaned_generate_text_restaurant_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 13.123048347593052, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.17809694322426664 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.517549307513542, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0031180867210341256 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.43869061890223154, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0027334989737563755 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.45359810879893614, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0022034543872964845 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.2511077989934143, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0024722315716345553 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.21132059138033674, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0021474197073557645 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.21805791826958687, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.001957141790282348 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.39019517006735716, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0027358415117223725 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.3300349352658418, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0023622100586565727 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.34126459914946794, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.001998609558923375 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.440642917422858, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0030367113114780704 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.37286555921974923, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0026300003525580365 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.3858165011376146, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.002254962578090558 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-2b8-55b-oscar-perplexity/perplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/perplexity25/evaluation/generation/slim.perplexity25_gem_xsum_article_DOC_summary_0.json b/perplexity25/evaluation/generation/slim.perplexity25_gem_xsum_article_DOC_summary_0.json new file mode 100644 index 0000000000000000000000000000000000000000..50b03505762240e1d1b53b0988bbb283b4ba3468 --- /dev/null +++ b/perplexity25/evaluation/generation/slim.perplexity25_gem_xsum_article_DOC_summary_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.14334820197523107, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.002033372138397688 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.32917310914311515, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.00467334236894172 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.1960206774900659, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.002686535722689693 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.02974498876833475, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.001087723908396391 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.0728412590146272, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.002755255015054753 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.04154197887366649, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0015125985867695552 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.10507181677422107, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.00149225380203505 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.2427717881723433, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0035988198386666427 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.14378872849238444, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.00198471645496706 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.11365988678450253, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.001665887050045974 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.26338940410019074, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.00403257453510768 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.15577151588810306, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0022348391906834657 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 1.6687565914580829, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.127910501427115 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-2b8-55b-oscar-perplexity/perplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/perplexity25/evaluation/generation/slim.perplexity25_gem_xsum_article_DOC_summary_1.json b/perplexity25/evaluation/generation/slim.perplexity25_gem_xsum_article_DOC_summary_1.json new file mode 100644 index 0000000000000000000000000000000000000000..9cf70c1f852a819638b3f113c148fbcc9d09d91c --- /dev/null +++ b/perplexity25/evaluation/generation/slim.perplexity25_gem_xsum_article_DOC_summary_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.21207140626368803, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0038581645356119865 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.27188028017390564, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.004158828718436913 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.21898919375507106, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.003161974309035466 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.04596243788195225, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.002111260719585874 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.05792023485426218, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.002400639714883728 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.04653779891739668, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0019224898943420372 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.1600433060616687, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.003027321129900961 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.206195928854708, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0032318040465927613 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.16526315756844007, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.00245003920287852 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.1624501288831014, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0030603591196422925 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.21143709654945458, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.003493647295925758 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.16845087952441407, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.002544682388183729 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 2.062682455534545, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.1911179218893297 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-2b8-55b-oscar-perplexity/perplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/perplexity25/evaluation/generation/slim.perplexity25_gem_xsum_article_DOC_summary_2.json b/perplexity25/evaluation/generation/slim.perplexity25_gem_xsum_article_DOC_summary_2.json new file mode 100644 index 0000000000000000000000000000000000000000..627a63c2ec9676ba548e1b37d5e582e39fd419f6 --- /dev/null +++ b/perplexity25/evaluation/generation/slim.perplexity25_gem_xsum_article_DOC_summary_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.23355885586659017, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0040933932598317116 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.2385966987781216, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.003652888212561435 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.22247490608623707, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.00332374416018175 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.05016034446830836, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0024329093612370433 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.047696834799867076, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.002112922260797895 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.04588995604221001, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0020485785234755694 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.17902471101461237, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.003278248895415527 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.18313099716581613, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.002898250408281982 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.17047566362303207, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.002652593386481074 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.18054581744258855, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0032824682399233847 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.18603681066581088, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0030547982184099508 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.17233290863534617, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0026846916387991055 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 2.2377052996018123, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.18315337554830305 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-2b8-55b-oscar-perplexity/perplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/perplexity25/evaluation/generation/slim.perplexity25_gem_xsum_article_DOC_summary_3.json b/perplexity25/evaluation/generation/slim.perplexity25_gem_xsum_article_DOC_summary_3.json new file mode 100644 index 0000000000000000000000000000000000000000..d0091884c1ce5911c0805fbbc0d7a8c6a7215ca5 --- /dev/null +++ b/perplexity25/evaluation/generation/slim.perplexity25_gem_xsum_article_DOC_summary_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.22480297343691372, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.004297306487708201 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.21981907620088453, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.0039007807029761052 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.211112685269218, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0036478084958463525 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.0473989148356509, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0023542959081873415 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.044786508086352, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0021615066754731775 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.04371921591233377, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.002063160703719779 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.17077143836517153, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0034539784947908905 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.1674256007148668, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.003116778223085841 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.16033960912306436, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0029061742252523438 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.1712430274478181, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0034669992286994146 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.16828003357354404, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0031669163990762543 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.16090737151266438, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0029284586568929447 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 2.4537857681806354, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.23835395567516868 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-2b8-55b-oscar-perplexity/perplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/perplexity25/evaluation/generation/slim.perplexity25_gem_xsum_article_DOC_summary_4.json b/perplexity25/evaluation/generation/slim.perplexity25_gem_xsum_article_DOC_summary_4.json new file mode 100644 index 0000000000000000000000000000000000000000..6dd16b69462e2950b076ed889be76b8e41250969 --- /dev/null +++ b/perplexity25/evaluation/generation/slim.perplexity25_gem_xsum_article_DOC_summary_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.06628555493620722, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.004121834877690951 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.05298448052806384, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.0032156118972841035 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.053717624136713174, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.003166748644311415 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.013816123034397583, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0015174056131048437 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.011050060864432654, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0011409900901498005 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.01137342409219753, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0011652172138052154 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.05250005230639445, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.003454023255202736 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.04113648447989776, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.002572146944390479 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.04172792112777844, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.002524762753775506 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.05270496397071321, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0034548599492127143 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.04137383186582083, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0025707709423569134 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.04194082850704681, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0025260321014198834 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 0.07986347109541274, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.0177976863312144 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-2b8-55b-oscar-perplexity/perplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/perplexity25/evaluation/generation/slim.perplexity25_gem_xsum_article_DOC_summary_5.json b/perplexity25/evaluation/generation/slim.perplexity25_gem_xsum_article_DOC_summary_5.json new file mode 100644 index 0000000000000000000000000000000000000000..7236851211b3d77123456a29d38c18bfb15d1386 --- /dev/null +++ b/perplexity25/evaluation/generation/slim.perplexity25_gem_xsum_article_DOC_summary_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.0008576329331046312, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0008576329331046343 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 4.2881646655231564e-05, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 4.288164665523099e-05 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 8.167932696234583e-05, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 8.167932696234837e-05 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.0, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.0, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.0, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.0008576329331046312, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0008576329331046343 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 4.2881646655231564e-05, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 4.288164665523099e-05 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 8.167932696234583e-05, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 8.167932696234837e-05 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.0008576329331046312, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0008576329331046343 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 4.2881646655231564e-05, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 4.288164665523099e-05 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 8.167932696234583e-05, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 8.167932696234837e-05 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 0.0, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.0 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-2b8-55b-oscar-perplexity/perplexity25/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/perplexity25/evaluation/rankeval/perplexity25_0.json b/perplexity25/evaluation/rankeval/perplexity25_0.json new file mode 100644 index 0000000000000000000000000000000000000000..844a10451fa10abba2beef4c12193074c86b7a9f --- /dev/null +++ b/perplexity25/evaluation/rankeval/perplexity25_0.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.35, + "acc_stderr": 0.015090650341444231 + }, + "anli_r2": { + "acc": 0.325, + "acc_stderr": 0.014818724459095526 + }, + "anli_r3": { + "acc": 0.3458333333333333, + "acc_stderr": 0.013736245342311012 + }, + "cb": { + "acc": 0.35714285714285715, + "acc_stderr": 0.0646095738380922, + "f1": 0.24550264550264553 + }, + "copa": { + "acc": 0.73, + "acc_stderr": 0.0446196043338474 + }, + "hellaswag": { + "acc": 0.392850029874527, + "acc_stderr": 0.004873858323840779, + "acc_norm": 0.492531368253336, + "acc_norm_stderr": 0.004989224715784538 + }, + "rte": { + "acc": 0.5270758122743683, + "acc_stderr": 0.030052303463143706 + }, + "winogrande": { + "acc": 0.5588003157063931, + "acc_stderr": 0.013954975072834738 + }, + "storycloze_2016": { + "acc": 0.6830571886691609, + "acc_stderr": 0.01075965095145212 + }, + "boolq": { + "acc": 0.5470948012232416, + "acc_stderr": 0.008706176885837738 + }, + "arc_easy": { + "acc": 0.5871212121212122, + "acc_stderr": 0.010102837421104663, + "acc_norm": 0.5210437710437711, + "acc_norm_stderr": 0.01025069260202258 + }, + "arc_challenge": { + "acc": 0.2773037542662116, + "acc_stderr": 0.013082095839059374, + "acc_norm": 0.2901023890784983, + "acc_norm_stderr": 0.013261573677520774 + }, + "sciq": { + "acc": 0.822, + "acc_stderr": 0.01210216767618359, + "acc_norm": 0.747, + "acc_norm_stderr": 0.01375427861358708 + }, + "piqa": { + "acc": 0.6964091403699674, + "acc_stderr": 0.010728079893076345, + "acc_norm": 0.6920565832426551, + "acc_norm_stderr": 0.010770892367463675 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/perplexity25/evaluation/rankeval/perplexity25_0_lm-eval_global_step52452_2023-05-13-13-44-09_0shots_backup.json b/perplexity25/evaluation/rankeval/perplexity25_0_lm-eval_global_step52452_2023-05-13-13-44-09_0shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..844a10451fa10abba2beef4c12193074c86b7a9f --- /dev/null +++ b/perplexity25/evaluation/rankeval/perplexity25_0_lm-eval_global_step52452_2023-05-13-13-44-09_0shots_backup.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.35, + "acc_stderr": 0.015090650341444231 + }, + "anli_r2": { + "acc": 0.325, + "acc_stderr": 0.014818724459095526 + }, + "anli_r3": { + "acc": 0.3458333333333333, + "acc_stderr": 0.013736245342311012 + }, + "cb": { + "acc": 0.35714285714285715, + "acc_stderr": 0.0646095738380922, + "f1": 0.24550264550264553 + }, + "copa": { + "acc": 0.73, + "acc_stderr": 0.0446196043338474 + }, + "hellaswag": { + "acc": 0.392850029874527, + "acc_stderr": 0.004873858323840779, + "acc_norm": 0.492531368253336, + "acc_norm_stderr": 0.004989224715784538 + }, + "rte": { + "acc": 0.5270758122743683, + "acc_stderr": 0.030052303463143706 + }, + "winogrande": { + "acc": 0.5588003157063931, + "acc_stderr": 0.013954975072834738 + }, + "storycloze_2016": { + "acc": 0.6830571886691609, + "acc_stderr": 0.01075965095145212 + }, + "boolq": { + "acc": 0.5470948012232416, + "acc_stderr": 0.008706176885837738 + }, + "arc_easy": { + "acc": 0.5871212121212122, + "acc_stderr": 0.010102837421104663, + "acc_norm": 0.5210437710437711, + "acc_norm_stderr": 0.01025069260202258 + }, + "arc_challenge": { + "acc": 0.2773037542662116, + "acc_stderr": 0.013082095839059374, + "acc_norm": 0.2901023890784983, + "acc_norm_stderr": 0.013261573677520774 + }, + "sciq": { + "acc": 0.822, + "acc_stderr": 0.01210216767618359, + "acc_norm": 0.747, + "acc_norm_stderr": 0.01375427861358708 + }, + "piqa": { + "acc": 0.6964091403699674, + "acc_stderr": 0.010728079893076345, + "acc_norm": 0.6920565832426551, + "acc_norm_stderr": 0.010770892367463675 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/perplexity25/evaluation/rankeval/perplexity25_1.json b/perplexity25/evaluation/rankeval/perplexity25_1.json new file mode 100644 index 0000000000000000000000000000000000000000..c5795019ace1b137eeb7dfac35d479ddf09969c9 --- /dev/null +++ b/perplexity25/evaluation/rankeval/perplexity25_1.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.323, + "acc_stderr": 0.014794927843348635 + }, + "anli_r2": { + "acc": 0.342, + "acc_stderr": 0.015008706182121731 + }, + "anli_r3": { + "acc": 0.3475, + "acc_stderr": 0.013751753243291852 + }, + "cb": { + "acc": 0.5, + "acc_stderr": 0.06741998624632421, + "f1": 0.35057471264367807 + }, + "copa": { + "acc": 0.71, + "acc_stderr": 0.045604802157206845 + }, + "hellaswag": { + "acc": 0.392850029874527, + "acc_stderr": 0.00487385832384078, + "acc_norm": 0.4994025094602669, + "acc_norm_stderr": 0.0049897778487910105 + }, + "rte": { + "acc": 0.5126353790613718, + "acc_stderr": 0.030086851767188564 + }, + "winogrande": { + "acc": 0.5351223362273086, + "acc_stderr": 0.014017773120881585 + }, + "storycloze_2016": { + "acc": 0.6766435061464458, + "acc_stderr": 0.010816828633068213 + }, + "boolq": { + "acc": 0.5348623853211009, + "acc_stderr": 0.008723771844458132 + }, + "arc_easy": { + "acc": 0.6022727272727273, + "acc_stderr": 0.010042861602178058, + "acc_norm": 0.5778619528619529, + "acc_norm_stderr": 0.01013462052459227 + }, + "arc_challenge": { + "acc": 0.2781569965870307, + "acc_stderr": 0.013094469919538798, + "acc_norm": 0.29180887372013653, + "acc_norm_stderr": 0.013284525292403511 + }, + "sciq": { + "acc": 0.875, + "acc_stderr": 0.010463483381956722, + "acc_norm": 0.863, + "acc_norm_stderr": 0.010878848714333315 + }, + "piqa": { + "acc": 0.6877040261153428, + "acc_stderr": 0.010812581599154424, + "acc_norm": 0.6936887921653971, + "acc_norm_stderr": 0.010754970032367323 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/perplexity25/evaluation/rankeval/perplexity25_1_lm-eval_global_step52452_2023-05-13-13-44-09_1shots_backup.json b/perplexity25/evaluation/rankeval/perplexity25_1_lm-eval_global_step52452_2023-05-13-13-44-09_1shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..c5795019ace1b137eeb7dfac35d479ddf09969c9 --- /dev/null +++ b/perplexity25/evaluation/rankeval/perplexity25_1_lm-eval_global_step52452_2023-05-13-13-44-09_1shots_backup.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.323, + "acc_stderr": 0.014794927843348635 + }, + "anli_r2": { + "acc": 0.342, + "acc_stderr": 0.015008706182121731 + }, + "anli_r3": { + "acc": 0.3475, + "acc_stderr": 0.013751753243291852 + }, + "cb": { + "acc": 0.5, + "acc_stderr": 0.06741998624632421, + "f1": 0.35057471264367807 + }, + "copa": { + "acc": 0.71, + "acc_stderr": 0.045604802157206845 + }, + "hellaswag": { + "acc": 0.392850029874527, + "acc_stderr": 0.00487385832384078, + "acc_norm": 0.4994025094602669, + "acc_norm_stderr": 0.0049897778487910105 + }, + "rte": { + "acc": 0.5126353790613718, + "acc_stderr": 0.030086851767188564 + }, + "winogrande": { + "acc": 0.5351223362273086, + "acc_stderr": 0.014017773120881585 + }, + "storycloze_2016": { + "acc": 0.6766435061464458, + "acc_stderr": 0.010816828633068213 + }, + "boolq": { + "acc": 0.5348623853211009, + "acc_stderr": 0.008723771844458132 + }, + "arc_easy": { + "acc": 0.6022727272727273, + "acc_stderr": 0.010042861602178058, + "acc_norm": 0.5778619528619529, + "acc_norm_stderr": 0.01013462052459227 + }, + "arc_challenge": { + "acc": 0.2781569965870307, + "acc_stderr": 0.013094469919538798, + "acc_norm": 0.29180887372013653, + "acc_norm_stderr": 0.013284525292403511 + }, + "sciq": { + "acc": 0.875, + "acc_stderr": 0.010463483381956722, + "acc_norm": 0.863, + "acc_norm_stderr": 0.010878848714333315 + }, + "piqa": { + "acc": 0.6877040261153428, + "acc_stderr": 0.010812581599154424, + "acc_norm": 0.6936887921653971, + "acc_norm_stderr": 0.010754970032367323 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/perplexity25/evaluation/rankeval/perplexity25_2.json b/perplexity25/evaluation/rankeval/perplexity25_2.json new file mode 100644 index 0000000000000000000000000000000000000000..156668327db939c12b98b763fcabe36f8a8bd6e1 --- /dev/null +++ b/perplexity25/evaluation/rankeval/perplexity25_2.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.324, + "acc_stderr": 0.014806864733738857 + }, + "anli_r2": { + "acc": 0.342, + "acc_stderr": 0.01500870618212173 + }, + "anli_r3": { + "acc": 0.345, + "acc_stderr": 0.013728421539454876 + }, + "cb": { + "acc": 0.375, + "acc_stderr": 0.06527912098338669, + "f1": 0.2619047619047619 + }, + "copa": { + "acc": 0.72, + "acc_stderr": 0.04512608598542128 + }, + "hellaswag": { + "acc": 0.3911571400119498, + "acc_stderr": 0.004870121051762732, + "acc_norm": 0.5040828520215097, + "acc_norm_stderr": 0.004989615052547474 + }, + "rte": { + "acc": 0.44404332129963897, + "acc_stderr": 0.029907396333795997 + }, + "winogrande": { + "acc": 0.5516969218626677, + "acc_stderr": 0.013977171307126345 + }, + "storycloze_2016": { + "acc": 0.6905398182789952, + "acc_stderr": 0.01068995674518907 + }, + "boolq": { + "acc": 0.563302752293578, + "acc_stderr": 0.008674684806135008 + }, + "arc_easy": { + "acc": 0.6052188552188552, + "acc_stderr": 0.010030038935883579, + "acc_norm": 0.5968013468013468, + "acc_norm_stderr": 0.010065668576794796 + }, + "arc_challenge": { + "acc": 0.2773037542662116, + "acc_stderr": 0.013082095839059374, + "acc_norm": 0.3037542662116041, + "acc_norm_stderr": 0.013438909184778768 + }, + "sciq": { + "acc": 0.889, + "acc_stderr": 0.009938701010583726, + "acc_norm": 0.88, + "acc_norm_stderr": 0.01028132801274739 + }, + "piqa": { + "acc": 0.6860718171926007, + "acc_stderr": 0.01082792813418964, + "acc_norm": 0.6882480957562568, + "acc_norm_stderr": 0.010807431424873669 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/perplexity25/evaluation/rankeval/perplexity25_2_lm-eval_global_step52452_2023-05-13-13-44-09_2shots_backup.json b/perplexity25/evaluation/rankeval/perplexity25_2_lm-eval_global_step52452_2023-05-13-13-44-09_2shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..156668327db939c12b98b763fcabe36f8a8bd6e1 --- /dev/null +++ b/perplexity25/evaluation/rankeval/perplexity25_2_lm-eval_global_step52452_2023-05-13-13-44-09_2shots_backup.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.324, + "acc_stderr": 0.014806864733738857 + }, + "anli_r2": { + "acc": 0.342, + "acc_stderr": 0.01500870618212173 + }, + "anli_r3": { + "acc": 0.345, + "acc_stderr": 0.013728421539454876 + }, + "cb": { + "acc": 0.375, + "acc_stderr": 0.06527912098338669, + "f1": 0.2619047619047619 + }, + "copa": { + "acc": 0.72, + "acc_stderr": 0.04512608598542128 + }, + "hellaswag": { + "acc": 0.3911571400119498, + "acc_stderr": 0.004870121051762732, + "acc_norm": 0.5040828520215097, + "acc_norm_stderr": 0.004989615052547474 + }, + "rte": { + "acc": 0.44404332129963897, + "acc_stderr": 0.029907396333795997 + }, + "winogrande": { + "acc": 0.5516969218626677, + "acc_stderr": 0.013977171307126345 + }, + "storycloze_2016": { + "acc": 0.6905398182789952, + "acc_stderr": 0.01068995674518907 + }, + "boolq": { + "acc": 0.563302752293578, + "acc_stderr": 0.008674684806135008 + }, + "arc_easy": { + "acc": 0.6052188552188552, + "acc_stderr": 0.010030038935883579, + "acc_norm": 0.5968013468013468, + "acc_norm_stderr": 0.010065668576794796 + }, + "arc_challenge": { + "acc": 0.2773037542662116, + "acc_stderr": 0.013082095839059374, + "acc_norm": 0.3037542662116041, + "acc_norm_stderr": 0.013438909184778768 + }, + "sciq": { + "acc": 0.889, + "acc_stderr": 0.009938701010583726, + "acc_norm": 0.88, + "acc_norm_stderr": 0.01028132801274739 + }, + "piqa": { + "acc": 0.6860718171926007, + "acc_stderr": 0.01082792813418964, + "acc_norm": 0.6882480957562568, + "acc_norm_stderr": 0.010807431424873669 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/perplexity25/evaluation/rankeval/perplexity25_3.json b/perplexity25/evaluation/rankeval/perplexity25_3.json new file mode 100644 index 0000000000000000000000000000000000000000..1ba27665266dd56723bcdd812bf4011098d60d96 --- /dev/null +++ b/perplexity25/evaluation/rankeval/perplexity25_3.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.314, + "acc_stderr": 0.014683991951087966 + }, + "anli_r2": { + "acc": 0.348, + "acc_stderr": 0.01507060460376841 + }, + "anli_r3": { + "acc": 0.3458333333333333, + "acc_stderr": 0.013736245342311012 + }, + "cb": { + "acc": 0.48214285714285715, + "acc_stderr": 0.0673769750864465, + "f1": 0.32804232804232797 + }, + "copa": { + "acc": 0.71, + "acc_stderr": 0.045604802157206845 + }, + "hellaswag": { + "acc": 0.39245170284803826, + "acc_stderr": 0.004872984492968002, + "acc_norm": 0.5030870344552878, + "acc_norm_stderr": 0.00498968630748455 + }, + "rte": { + "acc": 0.4981949458483754, + "acc_stderr": 0.030096267148976626 + }, + "winogrande": { + "acc": 0.5453827940015785, + "acc_stderr": 0.01399448102706599 + }, + "storycloze_2016": { + "acc": 0.6814537680384821, + "acc_stderr": 0.010774165229761346 + }, + "boolq": { + "acc": 0.5703363914373089, + "acc_stderr": 0.00865809540849789 + }, + "arc_easy": { + "acc": 0.6073232323232324, + "acc_stderr": 0.01002064655553869, + "acc_norm": 0.609006734006734, + "acc_norm_stderr": 0.01001299223254063 + }, + "arc_challenge": { + "acc": 0.26706484641638223, + "acc_stderr": 0.012928933196496342, + "acc_norm": 0.29948805460750855, + "acc_norm_stderr": 0.013385021637313565 + }, + "sciq": { + "acc": 0.893, + "acc_stderr": 0.00977991035984717, + "acc_norm": 0.882, + "acc_norm_stderr": 0.010206869264381791 + }, + "piqa": { + "acc": 0.6947769314472253, + "acc_stderr": 0.01074426704560648, + "acc_norm": 0.6996735582154516, + "acc_norm_stderr": 0.010695225308183143 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/perplexity25/evaluation/rankeval/perplexity25_3_lm-eval_global_step52452_2023-05-13-13-44-09_3shots_backup.json b/perplexity25/evaluation/rankeval/perplexity25_3_lm-eval_global_step52452_2023-05-13-13-44-09_3shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..1ba27665266dd56723bcdd812bf4011098d60d96 --- /dev/null +++ b/perplexity25/evaluation/rankeval/perplexity25_3_lm-eval_global_step52452_2023-05-13-13-44-09_3shots_backup.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.314, + "acc_stderr": 0.014683991951087966 + }, + "anli_r2": { + "acc": 0.348, + "acc_stderr": 0.01507060460376841 + }, + "anli_r3": { + "acc": 0.3458333333333333, + "acc_stderr": 0.013736245342311012 + }, + "cb": { + "acc": 0.48214285714285715, + "acc_stderr": 0.0673769750864465, + "f1": 0.32804232804232797 + }, + "copa": { + "acc": 0.71, + "acc_stderr": 0.045604802157206845 + }, + "hellaswag": { + "acc": 0.39245170284803826, + "acc_stderr": 0.004872984492968002, + "acc_norm": 0.5030870344552878, + "acc_norm_stderr": 0.00498968630748455 + }, + "rte": { + "acc": 0.4981949458483754, + "acc_stderr": 0.030096267148976626 + }, + "winogrande": { + "acc": 0.5453827940015785, + "acc_stderr": 0.01399448102706599 + }, + "storycloze_2016": { + "acc": 0.6814537680384821, + "acc_stderr": 0.010774165229761346 + }, + "boolq": { + "acc": 0.5703363914373089, + "acc_stderr": 0.00865809540849789 + }, + "arc_easy": { + "acc": 0.6073232323232324, + "acc_stderr": 0.01002064655553869, + "acc_norm": 0.609006734006734, + "acc_norm_stderr": 0.01001299223254063 + }, + "arc_challenge": { + "acc": 0.26706484641638223, + "acc_stderr": 0.012928933196496342, + "acc_norm": 0.29948805460750855, + "acc_norm_stderr": 0.013385021637313565 + }, + "sciq": { + "acc": 0.893, + "acc_stderr": 0.00977991035984717, + "acc_norm": 0.882, + "acc_norm_stderr": 0.010206869264381791 + }, + "piqa": { + "acc": 0.6947769314472253, + "acc_stderr": 0.01074426704560648, + "acc_norm": 0.6996735582154516, + "acc_norm_stderr": 0.010695225308183143 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/perplexity25/evaluation/rankeval/perplexity25_4.json b/perplexity25/evaluation/rankeval/perplexity25_4.json new file mode 100644 index 0000000000000000000000000000000000000000..b1e3b9a6df8682bbd2e4064e871f89858586ec55 --- /dev/null +++ b/perplexity25/evaluation/rankeval/perplexity25_4.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.328, + "acc_stderr": 0.014853842487270334 + }, + "anli_r2": { + "acc": 0.359, + "acc_stderr": 0.015177264224798596 + }, + "anli_r3": { + "acc": 0.3433333333333333, + "acc_stderr": 0.01371263383046586 + }, + "cb": { + "acc": 0.4642857142857143, + "acc_stderr": 0.0672477765493766, + "f1": 0.3090815273477812 + }, + "copa": { + "acc": 0.73, + "acc_stderr": 0.044619604333847394 + }, + "hellaswag": { + "acc": 0.39294961163114916, + "acc_stderr": 0.004874076250521575, + "acc_norm": 0.5014937263493328, + "acc_norm_stderr": 0.004989759144812297 + }, + "rte": { + "acc": 0.47653429602888087, + "acc_stderr": 0.03006330041190266 + }, + "winogrande": { + "acc": 0.5485398579321231, + "acc_stderr": 0.013986110301017759 + }, + "storycloze_2016": { + "acc": 0.6873329770176376, + "acc_stderr": 0.010720223172953174 + }, + "boolq": { + "acc": 0.5681957186544343, + "acc_stderr": 0.008663332644225124 + }, + "arc_easy": { + "acc": 0.5989057239057239, + "acc_stderr": 0.01005705110653437, + "acc_norm": 0.5976430976430976, + "acc_norm_stderr": 0.010062244711011508 + }, + "arc_challenge": { + "acc": 0.2713310580204778, + "acc_stderr": 0.012993807727545782, + "acc_norm": 0.3122866894197952, + "acc_norm_stderr": 0.013542598541688067 + }, + "sciq": { + "acc": 0.895, + "acc_stderr": 0.009698921026024961, + "acc_norm": 0.892, + "acc_norm_stderr": 0.009820001651345694 + }, + "piqa": { + "acc": 0.6980413492927094, + "acc_stderr": 0.010711732891588357, + "acc_norm": 0.6980413492927094, + "acc_norm_stderr": 0.01071173289158834 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/perplexity25/evaluation/rankeval/perplexity25_4_lm-eval_global_step52452_2023-05-13-13-44-09_4shots_backup.json b/perplexity25/evaluation/rankeval/perplexity25_4_lm-eval_global_step52452_2023-05-13-13-44-09_4shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..b1e3b9a6df8682bbd2e4064e871f89858586ec55 --- /dev/null +++ b/perplexity25/evaluation/rankeval/perplexity25_4_lm-eval_global_step52452_2023-05-13-13-44-09_4shots_backup.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.328, + "acc_stderr": 0.014853842487270334 + }, + "anli_r2": { + "acc": 0.359, + "acc_stderr": 0.015177264224798596 + }, + "anli_r3": { + "acc": 0.3433333333333333, + "acc_stderr": 0.01371263383046586 + }, + "cb": { + "acc": 0.4642857142857143, + "acc_stderr": 0.0672477765493766, + "f1": 0.3090815273477812 + }, + "copa": { + "acc": 0.73, + "acc_stderr": 0.044619604333847394 + }, + "hellaswag": { + "acc": 0.39294961163114916, + "acc_stderr": 0.004874076250521575, + "acc_norm": 0.5014937263493328, + "acc_norm_stderr": 0.004989759144812297 + }, + "rte": { + "acc": 0.47653429602888087, + "acc_stderr": 0.03006330041190266 + }, + "winogrande": { + "acc": 0.5485398579321231, + "acc_stderr": 0.013986110301017759 + }, + "storycloze_2016": { + "acc": 0.6873329770176376, + "acc_stderr": 0.010720223172953174 + }, + "boolq": { + "acc": 0.5681957186544343, + "acc_stderr": 0.008663332644225124 + }, + "arc_easy": { + "acc": 0.5989057239057239, + "acc_stderr": 0.01005705110653437, + "acc_norm": 0.5976430976430976, + "acc_norm_stderr": 0.010062244711011508 + }, + "arc_challenge": { + "acc": 0.2713310580204778, + "acc_stderr": 0.012993807727545782, + "acc_norm": 0.3122866894197952, + "acc_norm_stderr": 0.013542598541688067 + }, + "sciq": { + "acc": 0.895, + "acc_stderr": 0.009698921026024961, + "acc_norm": 0.892, + "acc_norm_stderr": 0.009820001651345694 + }, + "piqa": { + "acc": 0.6980413492927094, + "acc_stderr": 0.010711732891588357, + "acc_norm": 0.6980413492927094, + "acc_norm_stderr": 0.01071173289158834 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/perplexity25/evaluation/rankeval/perplexity25_5.json b/perplexity25/evaluation/rankeval/perplexity25_5.json new file mode 100644 index 0000000000000000000000000000000000000000..5b1e7d129bdc4ef36bfd3afdccb03a2bf53e46f2 --- /dev/null +++ b/perplexity25/evaluation/rankeval/perplexity25_5.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.344, + "acc_stderr": 0.015029633724408947 + }, + "anli_r2": { + "acc": 0.353, + "acc_stderr": 0.015120172605483689 + }, + "anli_r3": { + "acc": 0.3416666666666667, + "acc_stderr": 0.013696658778002515 + }, + "cb": { + "acc": 0.5, + "acc_stderr": 0.06741998624632421, + "f1": 0.32066849458153807 + }, + "copa": { + "acc": 0.72, + "acc_stderr": 0.04512608598542128 + }, + "hellaswag": { + "acc": 0.39314877514439356, + "acc_stderr": 0.004874511466836799, + "acc_norm": 0.4998008364867556, + "acc_norm_stderr": 0.00498978101559547 + }, + "rte": { + "acc": 0.5054151624548736, + "acc_stderr": 0.030094698123239966 + }, + "winogrande": { + "acc": 0.5516969218626677, + "acc_stderr": 0.013977171307126347 + }, + "storycloze_2016": { + "acc": 0.6857295563869589, + "acc_stderr": 0.010735132285108176 + }, + "boolq": { + "acc": 0.5700305810397553, + "acc_stderr": 0.008658853690729254 + }, + "arc_easy": { + "acc": 0.6069023569023569, + "acc_stderr": 0.010022540618945325, + "acc_norm": 0.6073232323232324, + "acc_norm_stderr": 0.010020646555538693 + }, + "arc_challenge": { + "acc": 0.27559726962457337, + "acc_stderr": 0.013057169655761838, + "acc_norm": 0.2960750853242321, + "acc_norm_stderr": 0.01334091608524626 + }, + "sciq": { + "acc": 0.904, + "acc_stderr": 0.009320454434783217, + "acc_norm": 0.894, + "acc_norm_stderr": 0.009739551265785134 + }, + "piqa": { + "acc": 0.6860718171926007, + "acc_stderr": 0.010827928134189643, + "acc_norm": 0.691512513601741, + "acc_norm_stderr": 0.010776164678037159 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/perplexity25/evaluation/rankeval/perplexity25_5_lm-eval_global_step52452_2023-05-13-13-44-09_5shots_backup.json b/perplexity25/evaluation/rankeval/perplexity25_5_lm-eval_global_step52452_2023-05-13-13-44-09_5shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..5b1e7d129bdc4ef36bfd3afdccb03a2bf53e46f2 --- /dev/null +++ b/perplexity25/evaluation/rankeval/perplexity25_5_lm-eval_global_step52452_2023-05-13-13-44-09_5shots_backup.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.344, + "acc_stderr": 0.015029633724408947 + }, + "anli_r2": { + "acc": 0.353, + "acc_stderr": 0.015120172605483689 + }, + "anli_r3": { + "acc": 0.3416666666666667, + "acc_stderr": 0.013696658778002515 + }, + "cb": { + "acc": 0.5, + "acc_stderr": 0.06741998624632421, + "f1": 0.32066849458153807 + }, + "copa": { + "acc": 0.72, + "acc_stderr": 0.04512608598542128 + }, + "hellaswag": { + "acc": 0.39314877514439356, + "acc_stderr": 0.004874511466836799, + "acc_norm": 0.4998008364867556, + "acc_norm_stderr": 0.00498978101559547 + }, + "rte": { + "acc": 0.5054151624548736, + "acc_stderr": 0.030094698123239966 + }, + "winogrande": { + "acc": 0.5516969218626677, + "acc_stderr": 0.013977171307126347 + }, + "storycloze_2016": { + "acc": 0.6857295563869589, + "acc_stderr": 0.010735132285108176 + }, + "boolq": { + "acc": 0.5700305810397553, + "acc_stderr": 0.008658853690729254 + }, + "arc_easy": { + "acc": 0.6069023569023569, + "acc_stderr": 0.010022540618945325, + "acc_norm": 0.6073232323232324, + "acc_norm_stderr": 0.010020646555538693 + }, + "arc_challenge": { + "acc": 0.27559726962457337, + "acc_stderr": 0.013057169655761838, + "acc_norm": 0.2960750853242321, + "acc_norm_stderr": 0.01334091608524626 + }, + "sciq": { + "acc": 0.904, + "acc_stderr": 0.009320454434783217, + "acc_norm": 0.894, + "acc_norm_stderr": 0.009739551265785134 + }, + "piqa": { + "acc": 0.6860718171926007, + "acc_stderr": 0.010827928134189643, + "acc_norm": 0.691512513601741, + "acc_norm_stderr": 0.010776164678037159 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6af430356697ad9492e65c2df1b2ffec67b4c0ff --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ab1fa0159d26824f3ac338f720ae570e7b43120fd42ce14f1e71060d5ee82ac +size 131677719 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ea6cf8c088abb96b72bf9a8ce2cb73f22caea85f --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3df742366789b3e7acf95542c7721973aaf0111e2af431251c395b7a9d55ad78 +size 131677805 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8c544965eaac8c3aafbc2ecb3c5a943dff5658b8 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e4fc6b53ccd54903e2589c86738062fb9eeee0182ef896e2b45d1201e47c88d5 +size 131677741 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..95ed20f58ed151993477d6ad3f250094501fbec7 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22f48f35f212c111e17069bf11bec64bdaa3b1360aa27cadb53b8e49aa3246b0 +size 131677741 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0ab6e489cf6600d8f0a90619470c45b4a20febcd --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e2dacd05d4e9a989776e7205ea6b6ddd2aed05c22612ecb11276f57f14ef4e8 +size 131677741 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4a8ee48c0e9d86123b7f6d0726f00ddd12f650dd --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:265bc2f48a897fc81bc16408cf8a4f7955b0a1501c7e01b8859ecbc93f256bab +size 131677741 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..46c571a15bedda0475318b614f73d1acec67bc01 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9c3af5f8ab069b628ac419e499a2b96fdcc254912a81cabfa7e70e5d1552079 +size 131677677 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5ba192560fe1f71990c1f06657d5b57794b5e74f --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e94764f6be05e884d6008821cf36308df63406b53ba1a3d500305db7966c5b7 +size 131677741 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0d8cdbebdfeb2d90be88e66c99a7a98d9145a4b2 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a30c939cf298d0a36942288a1f6eae40faab410c21499a13eafe4b3c9de7ce28 +size 131677805 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b3ec0fdc67218c9e7aadeae86b8d24867f73d1e8 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b5ced7d790d9d9b455f1c6cee8349e1efade817e2bd417234ef422790b847508 +size 131677869 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e3102292027ab4f0d072eb6077c65bf95796ae64 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:81078561887870a2ce28a7b902f49a39c3a7b5c447ef80e06676320ff9981312 +size 131677741 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c0cd6e57b08a8134e3cc78f2bc1c519f9eb10efd --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92a63bef09c768e1673b98de804cbf365d1c612697fd500579d4c6a4437a5b08 +size 131677794 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f2dc284112623892ca12f25849073968f3e48bde --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f63e5e0221305d5eabea3676258410c526ad4cf62ce6acac27789acfdc4a25bf +size 131677741 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a4b705728a214464c1bd3985bdaa8006f7750da9 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2985aa72dc97881d9a614e5f741fcb72fe475e33d5c2e1970458274c38effd7e +size 131677741 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8e2c2d74839447ffea53b352c9e763d5512cecb8 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3cd9747dee46b0234fd3293b38d5f3cdbe647f73c7486ce871f34c65c7af64e4 +size 131677741 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e56d6637cfe6bc505eb6315d3d655899889d3455 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a1b96d0f1c90b7fe893d6b9e2962370ec70762565faf244bec0b434f983a4467 +size 131677805 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..520cdfa444c2e01561e3a706c32db004eba2c877 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:263f7d2b4f40cfd2b2e75b8d5cb94cf3da2b430888b3b3c45757f084cba3b0db +size 131677677 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..368df2356787a143d3033f4fee2a17d5ee2a6ab8 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9eab1b8186de740352f5e86f5a82412a41b79ccbaa76332ae9d3c072a4a6fa4b +size 131677805 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6e09c8fae256a50585bcff7b88e8a9be7d0c24a1 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f4b8464b4da5c95646c20c337d75aa0983519939c2617e7833dfe5af9147a96 +size 131677805 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c9ef4fa4971348dc0a20ca7d0a8e11dd65dda389 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c7eb833018f16e44d83c65224677c706ba41f643797f2122878949a90302ac4 +size 131677677 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5fcc7fdb9c27bd535fe169ae350f16425cba1891 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4258e4d6c515d8a8a7c330723b849623310aaedd3ef4cf8b22b64118f2b23d34 +size 131677741 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..113e5d55ba2fce4783d43f4aca56824692da9db3 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b11fa95f0ea081f9a2e23c65113f15d7d4e8ac279de037844362f995bb0cf8ad +size 131677741 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d1c73fbe12609020822196188c55980d9ffbec43 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b7ee4c3292e67c96ec1981f7cdb29c559300f30fb142da2a563c8b2e4ff0acb +size 131677730 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a6475bfb97e6d77182514495e544ca1169225bd1 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca4923d614601c0606ab8bbb48bb22e80d2c0202fa3da7c6c1d7cbabcc340521 +size 131677677 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a35796b13daac5a4f090a27df2707bdbc258d3b7 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca877a95a9a7493180779754f7794f4d14e38aaf9d8c8d6a423a8a1331cbd22a +size 131677805 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..13e6b8cf3ed98aca913ae1e8309a51d317961399 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7453521215139c7cd13de46fcf88e1ac2b96991906d4ad5b10a9ab1bb9110712 +size 131677741 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ad14e8ed8faa87347fab3fde7fc2f48e3b61b96e --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f6bc4b71a79c232fab84235eabeb3cc41654396db5064b3d3c619d2675a14640 +size 131677869 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e99849a19e8c5b3c5865a9e0633d1e1d3bddd951 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:83807bf71d7f6997fe511bf3278327efc83157d76b0a5903c53b7469d95086a9 +size 131677805 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8f9e303a4a3fe1229538e4bcca3a97db03354728 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d6074b22c4ea85717779a8c14c13719e8faa7d77e217c43a2989b52671b1fb2 +size 131677741 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e06540f2e64753f09c85ef1acbf805c1db7755ed --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4856cd67474e74582f7616ea2a12c68488a88152f346d543c32615dcd78ccd49 +size 131677805 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ebb222fa29f03a9d3c200a985a1a482dad8d360c --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:16a54f8b246ded1f6e4913045b5709af4741110b08060aaa4c9eb85a639c4606 +size 131677677 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_128_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_128_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..552c99deb6d808d2cc50e687538ed908f5621aed --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_128_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bfc19a618450aab92f4f179c24d932c953fa26f0bd0ae99e50095789ab54a061 +size 131677741 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_129_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_129_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9eb257ccbed768ba85b211bc8da9ef4090dd735a --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_129_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:704e0a8f43ba1e42d2f52bd0077fb7adba6eebf5bb9bb0db25e05b3aa1406039 +size 131677677 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6085bfdfe7449ccc6fe23ebde25d1bb2faf268ed --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a01dabcb41c07632370e9ee65a095d5e7a7cde55fecd47dd5aca90520911fbe +size 131677730 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_130_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_130_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5d2eb77b771e4906253faef49d691771b3bf3c24 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_130_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:55abafab7524db72f7c72cca38d481f2b6775d9baa0e1bca3ab6121fcb79fed6 +size 131677869 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_131_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_131_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9686f635e9f74c8069662a7144df72e844af3ae6 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_131_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:faf35a60e67f8c4aee39ec80d98462fcfd71a61a0745780548d758d1c70bd7f9 +size 131677741 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_132_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_132_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..578c3aa15bc72c22fa7f0facfb492f5deddfdedb --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_132_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:38731f61d9f5aba0120e654e0a63f269f23a3e580eb1b9665c198f0088d67242 +size 131677741 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_133_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_133_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1f32b1a5ddd8aa8703a4f5a12a18f43b83f9d15a --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_133_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a0c95deb681b9dea174f85da917ef4690d0e03076a185898407f040fadc8ced +size 131677677 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_134_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_134_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..09d085f2652ac52355ecdc1f325b5c96a4f91086 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_134_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:563a0a7472944811e5f37b9b1c7d33bc42823294c457ad9c40b22fce65367472 +size 131677741 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_135_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_135_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..353ddbac57e0b9fce4fcc006860906e5e998e624 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_135_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:38656be8578eee7e81ff8af5cf226945c0719d4764e32d49dacbe2d622451c6e +size 131677805 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_136_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_136_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ab7b572e22158a8c77e736da6459b02cd215bea9 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_136_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3de5f4b48bf9e4468f4b94997f8156da4e3768400b68d9a3f1862063281dcf8f +size 131677741 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_137_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_137_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5e9f850f33ef5d4e0eb02117fe9b896e767a4580 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_137_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a822a79a2706dfc40e261e179a80d11133748644b01e89998caa279169d5a64 +size 131677805 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_138_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_138_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..eb64b0747729118e7d4e4b7bc50dcd6ed82adc08 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_138_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a4e254818305514bb977163a48e59ad2c120e1c185084d5b294d75a14dc7592d +size 131677869 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_139_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_139_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..37899176e69451f9bb8ff6cd1ddd92660ab7f30d --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_139_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4fb2682ac6f3470086e92325273ea3c9e27582830b85376724feb15b898df429 +size 131677805 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0b6ac408a3516ceedfcecf8cde8711f1e789f2ae --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:807b1dc02e06051dc25511eadb92054c886701187447bec8076955dbeed7c75b +size 131677666 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_140_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_140_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..132e213954fa4ddefb7416789a24b7a4b0f01ad8 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_140_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:978f56d31a78a045a3dcac423c07b2b3ec1fce9bccc6d6e884e3e5434d21b916 +size 131677677 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_141_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_141_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..75fe4a93f3fa8f471a67c7e93956ab43a63bb391 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_141_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:86324a8a007b4e5ae08459f0aff9c2bbcde51f51159a861ff9a729755094a374 +size 131677805 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_142_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_142_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..eb35366ff5f62dd2495074baecb7c7025486bf2d --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_142_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e194b9d0582448c435290587d7135770f77b59219fbefa39f66eb4b522491721 +size 131677805 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_143_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_143_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ca54ba594d0a89a85b4825f3d5efb613efbfd010 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_143_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab4d08aba0109022743d22b43bd4e5dc0e28a5e1d7e5f32f738e7369861ac0b4 +size 131677741 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_144_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_144_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2cf2c711a593f0753c6469be4bcff8f57f529fce --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_144_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e7156cbe3c91087d6689b11c75ae3368a970505f3a4880d89598c3be76d51d9 +size 131677741 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_145_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_145_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..eb69b8eea98f32c8d9159ada3dd571e9b1e5ccd9 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_145_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:56c21598f58898e37590fc08d26a70deb7feb7db6b37fbb1231899384bc367a3 +size 131677805 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_146_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_146_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2c7325f2e6f6d6aff518bdbd1e12c190dc94ba15 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_146_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e73d3d1846ce12b1e223e612b43b59e74ea620978e1c29c015553d8cba22914e +size 131677741 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_147_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_147_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..821130ae8dbd93c8138a10c7b2237e765e96163f --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_147_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39869802017f614a5943845866a541f3e62c2bdf9a3ee258e2e4062006ebee0d +size 131677741 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_148_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_148_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..11fe9585edf1ce8938e59ebc637d235a8dc59519 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_148_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23cbbc6ca49a187eb1197209dbe177dc28a9a7d5e81539fcffdff242e704bbb5 +size 131677677 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_149_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_149_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cd0f6e550d78106dfdff614e159220163c142df1 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_149_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bfd9d1c24b2150a9eca960bc56d7a10614c23cd180285a9859fe90a9ce730705 +size 131677805 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4633b75f5573c3a100ff294285e79d2c0d25a80b --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7819ea50a1d025727fa785ee8255a0c07be2fc395b44911f264c20f90d075ec +size 131677794 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_150_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_150_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9ecb0586d94740b8f5f462128c8dae3f804a7482 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_150_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34de8744896a076735a165c155b9118e58990663a4bd71a4c940a15acbbd7d3e +size 131677741 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_151_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_151_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..38f3822ca99e443c01e00b78020031025d47f1be --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_151_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba6c6da7194ce150f8f8ce902485b835f62ac9afb47b81a9848b765fdba74f25 +size 131677741 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_152_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_152_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..53e2137c63dde6415759369f139acb2a24d60d8c --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_152_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2dd21989111fb07aa50f5d73ee5ba1c40e959f430f00f84e2ad9b59fbb89991a +size 131677869 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_153_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_153_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9f32f08f2383f5340c498942ab7f6fde154711fb --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_153_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a35827b5f1b420148d0bea4ec1025c76a8e7db0e6682013353f34eeb448d639 +size 131677869 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_154_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_154_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8ee6d75f573ac25f3f3a5bc7e5ebf692ccff5296 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_154_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d65725a10896223c3bdc3b3a26026eb55784cfdc5b21b635e7c7efa298a7a9f8 +size 131677741 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_155_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_155_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8ec6c5271022aa795321a10749c6f300832c58dc --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_155_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd97719709080723bf7809263fe104d72fe8c0578aafd56d42a74aefce60336e +size 131677677 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_156_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_156_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..00e04d5675e4134e4f3dff3c2d6419e7878fe60d --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_156_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c2b2cf7afd8160774c9b7939936f7c7b0021b17a8a92c19b13744a61995ec346 +size 131677805 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_157_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_157_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..76f127a6de2b360196659d132561cdab70dbff7f --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_157_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f21dc330abf49551a1375402a00ce4b84337d99d959c4fe1b3f757b20e0416e2 +size 131677805 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_158_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_158_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b22f21e62e77851b2fb20bba4ec24e1542f39c34 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_158_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b98946dad08d90808eed55ea19f0bb92aa97d740f3b11926b8989651bbc608ef +size 131677805 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_159_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_159_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f5e724d6a2058e55592dd1479bbc1ffd97773614 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_159_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:273bfa809babb6c77450cbde6fbedfe9b960a2dce9e6c56f60f59d5c960e35ae +size 131677677 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8be425fa20f034f28b50104f9366b9bd9a2b057a --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba0cce2a827155f681ee270dcf4ea43c34f2d024f97b079a6208fc423e31051d +size 131677730 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_160_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_160_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c0932a16eb6fa5838fb19674e3afc1bdb7e1d428 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_160_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9deb4b65db020a931b5f1d0d208b9d32619a85d4d30576d245421ef6387862a4 +size 131677805 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_161_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_161_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..352ff6e5d6c564c4af5b2d9071706199ac0c6434 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_161_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ffc2217eb0a601491b6f924fab154b7582dc57612f019bbad6c562f6a4d374be +size 131677741 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_162_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_162_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..043175d518dbeaa3ac77396476b0c7bfe31f35c8 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_162_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b7e930a9b763d8a2a1479254464e2a12062c874185a097689624f28c06251b5d +size 131677741 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_163_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_163_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4d05889be1d45c9b3f01872bf1ae7907dbc475bc --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_163_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:93617c29701a072d301e70f40cbb3b69c402258ddd5764764bace7602d3e370c +size 131677741 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_164_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_164_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c6d10879570c08caff83a111d11e7e16350ddaad --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_164_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:811580e9d48f7bc0881b930d100a3cfb1a04225b6700b413f1bcf2897a0299c1 +size 131677741 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_165_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_165_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..37b3e761844295c276c11b47c53e2da196ab3f04 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_165_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e9f5369f805456e7faf61869e87849d6e2d201d419ec0fdd9d08ace2d09ee0f +size 131677741 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_166_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_166_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fc9afd06997d396c1d32b58d653ba2ffd3a749f3 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_166_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:70dd245d429799e8a2627b03815dd0f90630cd327452f67dd991d25e41a4bca5 +size 131677805 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_167_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_167_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..936a1f69536d53b035476f65cd952c5582d1fb12 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_167_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31d1d31e4810fff9a49cd6fd14a47364bc1c3fdf4ef0e16015301b9633458c79 +size 131677869 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_168_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_168_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..918f95a09d710a2e4461ea898e594e1c6dfa3aa5 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_168_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:baf9862d07cde7ab974f8e2ab1f67fbbf70f4a1176b4aa15c4fdbf2ba8d17e57 +size 131677805 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_169_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_169_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b649d981883b5ea1211dca2024e4cb9e1bee660f --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_169_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:002f6180dbeaac708ac4fc6449613c9c36f6884282f9df2f82b5792dde47a74b +size 131677741 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..504bd9b50521b561019c77b3dfe71a2cf587bdaa --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4408e2c3e62805e4f9262df600599bbcf78359a19019b2aed3f1d49e4146ba53 +size 131677730 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_170_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_170_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..286c422965302ebc3a8222821895d658eea56670 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_170_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f728909264cbd6b1171a5f883eb84e6a9297eecc4717abaf47767f3b4789752c +size 131677677 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_171_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_171_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e83895f097e32f184bc09e57a3205f0790dfa3bb --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_171_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f8f403a2d315c32eb70ffdb4175ba73d8f9e8854f96d4fee06ba05dbfc06a2a0 +size 131677805 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_172_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_172_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..44bb38b09e511257ff7bd06c2dedee389edb0305 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_172_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f201c11dcbee46a7c73d759e6c73b0235d33dc962234ecde0f204f1d736fc2f5 +size 131677869 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_173_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_173_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..392052666970ad103e58f575c91da7892fa3e731 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_173_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d51ce7c92b0207109f455caad3b98b5ca43a9bd4d293a012bfab03ad781d99f +size 131677741 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_174_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_174_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..abf1fd610b0fb6eb4beb3fcc15aead107dccb81d --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_174_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:93b1f926ff93ceba305390b003ccc903ceff96a8425109f9bbe68825ec7bc39f +size 131677677 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_175_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_175_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7d1e191ebe9da5ec6a5472897fdaca54a758ea37 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_175_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c257a22f7a25b475d1a4994c970069b3901dff1ffdf9c21ce00e433e8f8b471 +size 131677805 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_176_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_176_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..07b74dd3a5ab35e272d0c2f380f43633c90ed1d9 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_176_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dbcf79492c2b1330c12f66c22015176693a8ad791164af99610af77e5a9dba1c +size 131677741 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_177_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_177_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1960ec0ea86d7bb82362a1cc74a39b79a44bd434 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_177_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3008032e4033c540ae761465be88f921ef1478a48ee686f1154114e8bded131 +size 131677869 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_178_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_178_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1ad89f0018ceeea715519124c2d48d9c0757ba4f --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_178_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2582ed054d10eac860fcfb0b9f6903a5deb221f7225da4fefcbe1391bcd2d5b6 +size 131677677 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_179_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_179_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6c155e3ede1c475ab8df91b70843ce521e532298 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_179_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d8a0665a3961b9262422bdbb8c750016e8086a113f905aae8cb6dbb7509c20c +size 131677741 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..aba20a4dbda4a5a018ecf3e50e1bc02e6aa030e5 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf99bfca3dbd87da518e994a6db306ac540f6e0c03dfc751adfa00b6be89b70d +size 131677730 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_180_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_180_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..18873db0f2e6a3a1fcac054939ff7ff8ee73e0f3 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_180_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8025577f73c5bfd4a2e2fe8db921bb0a7d7879372f1d167974e14bd7889a7843 +size 131677805 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_181_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_181_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cbbbe1c1eb0b05c78fbe511b8760ce0f107371f4 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_181_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:115cca5a9f426e1166a63719904449705da85c63d6b508cd10ac27203fb137d5 +size 131677805 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_182_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_182_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fd176b081069ea4ff188a67d93ef6515ee359e15 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_182_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c621d03d02c5299cc9a557d832cb661bf90bbc3b312d0a54e8f05259514c39d +size 131677805 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_183_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_183_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..01bae50e3db9df1258acbab300aaaee29476850d --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_183_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4cbdc797fb5d9197907566ed4421978da6c9cf236a1336f4b9ab18f3981b2630 +size 131677805 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_184_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_184_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8583df7f7e97fd28150eb29b55f7e880741d2143 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_184_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:120340e9b7ad65ad925c3e8b083ec9ad3816b60886a8719e896917e3d1d6fe0e +size 131677741 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_185_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_185_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2801023533db0892b504a4036058bea1676f2d84 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_185_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f17245f89e396a3cc938e8b654401bc5ecf0aa6ff7f6f63dc9ae69dfb1bfc7c5 +size 131677741 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_186_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_186_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..89556b7a58b971842fda723fc8a58d2641344fc8 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_186_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff37a8cafc526ede7bcea22355f93db07ad468924950736ee33e7a03217cc579 +size 131677741 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_187_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_187_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3f39833c43418da8e7245c87de4011bc5e6ae3c0 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_187_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c19b3accc6d66f794d30fda6df1af3ad18d6a613267e7fa5cdd1d51f9d3f5b77 +size 131677805 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_188_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_188_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4acf80d8d7e9bb1ad2984a04852514562fabfde9 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_188_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2780ee8f486d84072950bfa44d3eed2d66d14e1038da182e0dafce9daa302887 +size 131677741 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_189_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_189_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a0fbc39da477efecdf2cb47ae33e98d9b7dfc380 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_189_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:67357627587b0f1623286da4d4f13086e1eed063aeedca3c55389ca58e7773d7 +size 131677677 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ee18bff680a03fb375b707fb68bd23d16fb38c06 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa3bf69f44f38bce173dcf4ae9dc8857bdcb6c2e9a70b97095d897435edfd5b7 +size 131677730 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_190_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_190_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..655621bc3bc00559a22ceb335dd26956fcb95561 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_190_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d15e5f2e0a57bf61557f7a8d450a09d5f01b54fb06ba3aed83a6fc8a2bfdd1a3 +size 131677869 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_191_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_191_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6a3e93a2e9c3a4651dcbbb686102e3a1d54bc831 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_191_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:035786a9b3fa470c06e15946e78c021dc55fd4732e466596b594a2672b786e35 +size 131677741 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_192_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_192_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6ab8e8573fd77a440596a67947e9b4c1ea0800e1 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_192_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:308114165e703f1e51d48a1044bea9f99757491dc18d7318168409aa43a81e5b +size 131677677 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_193_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_193_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..df4b906b4ff606171da692cc1c9a51a1c2a3bbf3 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_193_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c2a635873a1c86f4a9a9e439115f4ae49b2b59e552001ef9703266ba1f588f4 +size 131677677 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_194_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_194_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..22b5382fdf011d10e81f0bbcfb81f6ddaa5c8a65 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_194_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06208dd8662e9cff5f8d7227614d1c622d07996a55872ad041629ffdc7e99b53 +size 131677805 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_195_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_195_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..15a080a15bc90d7d04184949d680d6d3fed58137 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_195_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1303ceb0a1043dba1b80579f7f6c4376e570b4576838d5ceae13dbd0a5293812 +size 131677741 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_196_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_196_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fe02f75af0a6cf040ab0369f69a1fa92e578427d --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_196_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a0a6f0bd9e2472159868c93e8482536192da36887fbb030cc151b6cbb498629 +size 131677805 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_197_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_197_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f039e255945be63b3593761e108c2db2e366b0ab --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_197_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4778149ba20f9be4f30f48043afd85ff579222c5f3e350017d82531aa6af6673 +size 131677741 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_198_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_198_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..09f5405408fa1387252d942217a1ea9b7b5b0a37 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_198_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6f4764213e04dbe071b8a29e620b1f8fbb3f55ebb9683143e3e57cbb01dacb0 +size 131677805 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_199_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_199_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..debf6376f1c2ac26223e80d6ffcf0dc4a2ab3c4e --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_199_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b04375c11f59b7070aa9c874c983254df41db2e539b2032f339ce0c2478e0a1a +size 131677741 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3042ce0a786cf00ab1863b42922eab8a6c38c733 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:49426ecd74b480f74b7a40742bf2cf589c134fae43d21699a7063cde28d9a12a +size 131677858 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..452546df773d69a139f6c17a7e900692560a0364 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a53ae8768c907a2eeef3be86e225f4bf443060e178d14a2a1b29e5677b55810 +size 131677719 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_200_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_200_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..918778c1bfd9656d00c0348f8e4d1f18beecf4b9 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_200_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b7e094764f9951002bcb6605d8d371104e6ed06374554197e56584bdb3f4918 +size 131677805 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_201_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_201_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b2d927b8ce8cb1c5574d7b2d6098d4204748cae1 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_201_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7262e84710f48037eb520bb77837e76e9e8b80d190198e6b0de4efd90456f208 +size 131677741 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_202_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_202_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..40746c19bc582730bcb9213b161b91539f8cd934 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_202_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8659b587c657c5b1e1f8c8d759befad99e45bbebc17730640709c76c9d8fa227 +size 131677741 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_203_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_203_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3c675d8899498dc55694d5fee9562f814ca7a789 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_203_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:69d049d334f340dae420e43bd1ed6517ea715b5190faf2dd8cde0d238b648dd7 +size 131677741 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_204_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_204_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1444d66f377b5c3a51535da1ac0152467f586948 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_204_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a7f213774eecbc4b3c5f84c914ee5a61053d2fce16c057757691c3b77618aa79 +size 131677741 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_205_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_205_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cc09705342a0956f2231b75e1ea00372d80b32cd --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_205_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a0fab726fd1102ea1f23719336c6c650a8a55771b7ede66499e90c01d0091453 +size 131677805 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_206_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_206_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..940636a08b3860098d9b8e2327ef5e10fa549c2c --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_206_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1e33f724959e4560353cdf15c42349a4f0891a6d88598d6ae2f4550aad71e1f +size 131677869 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_207_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_207_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e0f9b5fba8f0df61a299e7230939b6b95ecea4b0 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_207_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5878b31617c8a3b4581c370b291000b0e31ee1df4824e26e01f1ef27b5751ab2 +size 131677677 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_208_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_208_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..efdbb1ed677ac766e5f35d90458db5cd980b354d --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_208_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:54ff2a28539e4df4666ad16dfe8a58567ff8d08928a10b169230384f9657aaff +size 131677741 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_209_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_209_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3c5c552d04caae6309e2b3a0ba6cb78c03f1b0ca --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_209_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3fa28fc8477f43acfda4610ad6206bbacd426e134f203633dfd11389e6c5a7f +size 131677805 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..764a0bfe8a5298850619829e2da0b506df954672 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c9e3413b6013900d859666442b67f0475a2f066d2775f3005d010335e303b95 +size 131677666 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_210_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_210_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..10575f0ccc6ac60ffd590508a177989fc12f3a00 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_210_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f4f7ed47a6348770f4b8dfe47e385c0c58cf80db2fc993e58c5639706fe314a +size 131677677 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_211_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_211_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6987bc4c15f51c21f0d733a8a0ace782fccf4624 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_211_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f92a0383d7c6cd89020118ab84f2909cc34685f71bcd0c066b5dd7021b91c39 +size 131677805 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_212_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_212_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1b1ec2c65fc82c7fa3910082c0ef23b54b98fd83 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_212_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ed8632a62272076e06c53e9728e0d27476f75f46c5c830c0ed86dbb792b22c4 +size 131677741 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_213_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_213_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..80a18aeff02f3537bc01cd018bfe3dd90a90b8bf --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_213_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:94ec02b57fe07171cf65471fcc7dc60b215e0713ce9581ecd7a7ce03c00b8362 +size 131677805 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_214_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_214_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9d164b328701ff6edb32a16c2306c4d79a9f86f9 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_214_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4fb4c20817cd910104fb4c9921054f317c22fe5b9e7d06b11d76115f1a059a07 +size 131677805 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_215_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_215_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c85827a59bd4883cae25dfa27157e8ed6abffad4 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_215_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f0dab69f77d96b4bfef95c78e2cf02a10ce2627560007219a44d0bca7a0255bf +size 131677741 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_216_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_216_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a5bd61a9d13334de548ba9dfda66854884062a1e --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_216_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:60ce1d44aca732ebd93cf8caa9c18bf0793b6c66eba13009182f4f0720092470 +size 131677741 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_217_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_217_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..98ee48af83e14aabe3dd5c713fb8b2e06fc871fd --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_217_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1966d9d330108898fcdc7f43403b0752da474c6e0988f68437db7f0bf95c09b +size 131677741 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_218_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_218_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e3edd39ed69d51f9135c3ae29212e6f34d174355 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_218_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:82b243b776d70c31ecbde04b85ad103ffd2009f28edd77e278fc14e34af6dd16 +size 131677805 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_219_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_219_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..89d12891e4df715e88309cfff5c4ee55e30359f1 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_219_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9aea055ac476ee25dfe33eab5ac668bc75541f9adee916f93a67b20d8e642f99 +size 131677677 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..93061de192928d6f046f551ae30d079a9e881c55 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d7bd20dfee409360a5283700c6a8a8b54a664640bb4f01353ba4fdc7760e889 +size 131677730 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_220_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_220_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0e9e7cda30db48e0ad19e79c0e6c01e580302ef0 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_220_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b2912ae0475516c5cb77afa1943207d499ca9dc7d6739510c18256f1aaccf134 +size 131677805 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_221_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_221_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..56a3e9994b5502528ff71311397eda60dbcdf2a0 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_221_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:07b1a202252a709fe802d7db927eb392526c440f47b55a623cb0b5722cb4dbef +size 131677869 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_222_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_222_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..545f86e364f13e76956e28ff9ef8c2139627780e --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_222_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d66b7f450545efc0b9d8ba1f83f8129983bc077fc8b61574d6667161a468b76 +size 131677741 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_223_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_223_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d7dc48be5649dca59c3fea0dd76f3a6e4c991caa --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_223_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc88dde6754bc7557c47d3489470b7aa64f8189ad256046c91f9a7706a1364c7 +size 131677741 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_224_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_224_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c49b376ba7994ec6e4a28ce1dc8f105a1e1aaae7 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_224_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:561eb4b8c45330ce7179fed9bd9933e62e5ffbb0ce616998ce76394b9dc403b2 +size 131677741 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_225_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_225_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4c7edf702e2585e1e11db84feb4e4c0504d14d6f --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_225_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1300b45175f2e78e7ff168f58e3484b1c59b9167055e4969b448f31f1da62d52 +size 131677677 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_226_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_226_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f944b4196e761553667eb6abb9ac12241b8393a3 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_226_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:666b2ad2a888cad7897d8ec0f1bdc248f295b969d47ffe64b7592cb3de4ad9f9 +size 131677805 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_227_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_227_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dd385a671ae136671bed33f2931642cd82615a9f --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_227_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ba0d45bd88ab586de8cd85d7ee0aca9f059150d808090fe489e091448781463 +size 131677741 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_228_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_228_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cc175aa65a298c3d282b1d313b5942fab70cc471 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_228_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d5a990de71b65686e3e3c50c4f6e83b6919ca1557d93fe6b2fada045b1ec1e11 +size 131677869 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_229_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_229_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8c3d3b30677cb187066cecce38bd99114f2bbe18 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_229_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2180d36e881b2e21b1d28d7792c3b40f6a65ba337607da44ee4336dfad045306 +size 131677741 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4733e9fc811a5d5271578f7c05f0e6cfbb58e40c --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e1891d72d3b36f7da4c0c799a326a0c871d7bbcdbdc0633ace3a47c1117168a +size 131677794 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_230_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_230_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8d1efcfefc12fade2f6c0d35244cd6a9ee790165 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_230_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:278021c2a24ebbd43670178919e8729ceec992dcb596d409e5f4f90766dc66e7 +size 131677741 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_231_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_231_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f8e037050c359d326d9b12f5789fd7bb9ec739f1 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_231_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c940d9020e5ab10f9114bde4aaf9bcde497683a7954351edd6dc599b82dd7e8 +size 131677741 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_232_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_232_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4d8c4eddf2b81f5a7f01b66c1bfb76b73bd73cc3 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_232_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e96f04c3df3039a7c425cb3469f68f027540dec3bc0734c45dcdcc3abe3f66d7 +size 131677805 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_233_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_233_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..33b3edb8b328fa12722adf59f6ac55ac2bca0dcb --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_233_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b27543d948465661ddfeff42c050d59ea2c9c4f58a222816460196076635104a +size 131677741 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_234_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_234_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7fe82551d915a44db62ed6b57ba7c9631f78c5db --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_234_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f187904a2abe58cdb95dd755fe6e0013ba32a02c6f9f6151955fab2e75981803 +size 131677677 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_235_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_235_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cbf7b94378340782086a415ef32e995676b69f6d --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_235_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa7a9cdfad63322ee01d31b68517ab77d1be18bf25ca2dac4a41d39b20866e1b +size 131677805 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_236_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_236_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b2b2ea7c43c6915bd72c5f7634115e8a3e1db952 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_236_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:391dade29a90d332c81dd663006b56f48664359ef23eafc7311c8f32c941ca1b +size 131677933 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_237_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_237_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fb52fea940bd8b9c1c6ce32c8a141214b11506e8 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_237_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:920e677ab4c003b92ec96b6145d9d6198507759ef0befd5f03246a42e569ad0a +size 131677741 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_238_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_238_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a1a346d2894cc9369bba90238de948d2b5838135 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_238_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8fc5f3168cb649567e98ae46fd9858a7d5fbbcb35f86e5554298d4fa6949a177 +size 131677677 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_239_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_239_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3db40db13176dff5dcd218a4f58dd30841dc5a56 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_239_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:429e8119bd88ab37094fed408000e827018e2435f057d4b46c42dc3c06d99f06 +size 131677741 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..407a28cd5bc2ca5cd42bf9aff966e5a4eb144c9f --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b704eb90e60fdcf6fbad20b35f900644a58843e5fd4cf55ec5c50900d96537e +size 131677922 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_240_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_240_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a33d17f4f61ef614a1b18289c3e1830a6687a2e1 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_240_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:083b0b7b4bee13ccfbdafa5b335a3dc1bfd0967c73b5dce35b10623b254408ef +size 131677677 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_241_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_241_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a4ae5269dca09c4e2e7ca2e25a344ebea36ce45c --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_241_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c87769e35835e96b87cdb1002377c1bdea7340477f54a0cab13f5b2cea4296a +size 131677805 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_242_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_242_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bd617c1de96ab75b8c99b0cba4839ba67ede4148 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_242_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4bd9957c32bb5720abba5a5cd73b01d64764a8dcf6d2ea85970d4475732be964 +size 131677805 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_243_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_243_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0b898aa36d54db4ca157619e2ec69987fdc5809d --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_243_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc849becc2449ad706a12002966039302b29d67ddb0d306220c7b96af28cac0b +size 131677805 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_244_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_244_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d86826446690ff53ec798a4c0dabf1fe723f1018 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_244_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:561950bedbb869a36a8c67ec23cb0423027bbc98ba06df26e3bbfc802fc866ae +size 131677805 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_245_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_245_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2a1265f84b699467f3817c9d405deca52bfd77ad --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_245_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e7a8b9e9738cc54d2862c60cc0d72a419e8a0a0614b5b797a1aad9f13eaad52 +size 131677677 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_246_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_246_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cf4eb252148067e4a0c3a6f4fbec821819ef999d --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_246_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:150ed81018b3dcd7126e545b3bcc08b27bd7cfc4464ba9d74996e1daaad89162 +size 131677869 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_247_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_247_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5252f1de46cacec4461205a503f953f1b476bc47 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_247_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d82984436967bab101bf7e0555cf972c9b86fd14ececf453dddc8ded270f11b7 +size 131677741 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_248_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_248_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1ff967210401cb0571e59e86dc2845604ac04b89 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_248_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:07358aae7d0f9ebe87a03a24e03e2784e87c1ad72ea535f63645eecbba841d46 +size 131677741 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_249_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_249_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..614dfd764952ba6f5bc4fde9a27507e68744deb8 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_249_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef5d9c8827f1d96aee41c93be2f89d565389331d442eccbc6f322b2d60a49e8f +size 131677677 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..37a16f7dcee1edba12026c55c4a980d5dec6bb24 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:15742d5acaf7c2412a0f245b887c7711f193e4cdc8fc281708e966fb3a0fb35a +size 131677730 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_250_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_250_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b3b47a46845eeafb3229288560302e6431169a29 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_250_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:00ca4bf194244c7789259c6d7221a855721a4f750ea35c71bfbe860e9c952033 +size 131677869 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_251_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_251_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..249b5c27cce3555b02b0f0c3bb289d30f9d3fbff --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_251_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b490bffe8e011997b867964f84ef7f3586d0d3e2e0dfc120477b66331b22688e +size 131677869 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_252_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_252_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cfe40b17e069ec599905b4419734c8e8bbfcf831 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_252_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:360916c4e55b9ceefdc8e1b3efaeb966c6a3b8ac5bc498f195a28e47717ee66b +size 131677677 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_253_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_253_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..60f9535cae95f2f204ad09ac1d7f8a732e9adc06 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_253_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a4b3543585b089f3f689966cef384d0461734589db6daf9609448fd0fc445cfa +size 131677677 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_254_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_254_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d419ac7a5213c01366a734744974887a99a8752a --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_254_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ceb5e29617fe1e5c542304db0aa058bea484fc42f7d7954c47fc1e6eb7fbfa33 +size 131677741 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_255_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_255_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5c26f7a8eddad44f2134a2b0bee6b32a9f88bdf3 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_255_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:298e3b58b1295e2b6b3f3c5d89e1059722080d56ab7a6ce5137d0de1c38c3406 +size 131677677 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fa332e688d1c4647f28fb55792897a489152b8b7 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a1758c3afbe2ee529376f3727d23a7f43a39c623e87fdf220c4bc3c91719ad75 +size 131677794 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..13b0342bc138132ca84fed71fcb5bb9b5cb0624f --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bffa356dcb5305599f0d0b5fd082904ee9569beef8f8f754c925910d717b4c58 +size 131677730 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9cd4bd6eee12aa499b5eb371c52c0fb00cd500ba --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f2729aeb8bc2838cf9edc6fd15adea2390fdd0ed278f559f833b28b004009c1f +size 131677794 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2f8c7e83bf23d3a3a4ab2691e4da3abc100c0945 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22d19fd91078fe266fa1d1fc318ff2d8d59d851ed6cf9331eb956a96962afc60 +size 131677730 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..77cc5660f9c92b54fda527617613b694c456f1b3 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:30dde26f443648da55adf8df8b5fab40e8bc7b2e9746fb5339249bdaab82ccff +size 131677794 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..283df0d00806bef8d191bb703c23bc6f564e47e6 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b4a6ff29418f15835f89a09e5fbe66069c70ac8bbdc83716bc643167bb84df95 +size 131677719 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a385c7c1992d7feddbc993d3a83780c1812898ae --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:733a711f33c4d47a6929e9a0a51a5f5ac66a940df1973c3244caeb7b94e1538f +size 131677666 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..430540f9b31864bd0b901dd1e076289c3d2fcc77 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:222f0768963f7ea89d46d5eeb42d70b864c394305214b0ac6e79e4bd43d05ba7 +size 131677730 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3ea0b2b30c6abd05526c733531a8b120511270dc --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f790268f8d6c8f3574f66882fed77346c66f52f3e8120ed060781e65a66e9e9 +size 131677730 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..51935d83b20a2d5a703c940492b86156c38f04ec --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10e83f5fd758e393fcdd16c94d9633c22f02461681e6e2fdfa5578ab54e1e14f +size 131677730 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6f581f619c579d31be2cce43bce0ae260c596efb --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:885e933b54284a5322f4827ade6dcf621aed502bae556d6d44fac626dbb75925 +size 131677858 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cb1e098014c771556f06a558f835fda0ff0c5d46 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ebfbcd35a3ea42c5c20088cde2458456c773d30e47aa09dd44bec44c8d8250b7 +size 131677666 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d3438958ff1fffabf0dbd3a3514dcd7ab8ea2239 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf856c54e4b7236c5d8db766f6dc5fa0ced3ced1a549ae14ac4a13f70e948365 +size 131677730 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..662f275ce2fbe0d048e154f296da9b9ec02058a3 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0dc83b745fd505cae3fa2a25335071eeb07f21c872b467f61e27938ce91a1a7f +size 131677794 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..04e4768e910b6988c609e1483a03d5ff04c9fade --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:835d096d947272cdfc48d1a99ab4eea9b1f872231ad65411ac39d9029988ccaf +size 131677858 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f0835089c7807a2db52fb9f3ed08a1a34a328e48 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7c7e07e487a93d33ab2e4634a014901c86b2f7de9885bcd4c30fe8cc6b9040b +size 131677730 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..99d892aa50b08eeba2c2d4bc4ee76929d82be6f4 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b54b6983281d19e9a67bd6576d2954567560f79f5f0251797ba998aa89aba2e7 +size 131677719 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..86cf2487c97dfbc49e1f7fad1559035b19cdde0b --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f95ff93506f0d69b127a139fefd44c9d83fd80c58f7bcb76b113aad11d556735 +size 131677794 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bf6b9f9640eefa67e0c2b58eddd854b203961ed4 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7575992c49867b17c21a7bbc0d79f5686c1e2bfc58f134b2e5107b8fc6afa33f +size 131677794 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..02104d4c02d3e5c8d106b9816a56117d55cbbd1e --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:99cd01c0471117a6345f3cd63d74a2bc52f71f5cf6fbbbba39df7e9795425d67 +size 131677730 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..61b50a1eab88488d2dacbc3f88bfa977b0d815cd --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dbf1fab0a17f5549c62a11e349b2359aff8b21a698028c6905445b5dcc048405 +size 131677666 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1e06c65ab73ce38039439d8d9fb81d88cf073d7e --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b58455e13228b1dc3ccfbfa3c39bacd7fac04c2b7c3b4cea1b67355bc9622856 +size 131677794 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..515859273b80594d4867ac59b83f44a357268656 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d99308cf345ec83dbd713c286f910270d721bbf784189f483138172eec8bc7f3 +size 131677666 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..468be26fcc3aec32af1c7634cea38db67bb879cb --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b85647ad7004805d30de15fce52bf77ea430eb1902799ba50d16a641c0d072dd +size 131677730 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a3ca72266a43347a229921047038291cbba8db2a --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c17a623dfd528aa9d21d4288863a9814b5049a78a34cb25df9fbb4e1accb27e0 +size 131677730 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5a86c1ba7d48b8385c65e14f1ca15cc3e6dc42f6 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a0a0ce6e8267865e5d2c830c5dcc184d546f1f1628ce5a825ec92f30669c5152 +size 131677730 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..63948cda7a649ac5a674ea99d53f4bd44dd90665 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:98ccb6d60509f2774d8200f8cd27409819b5d61172aee9347676f88045801a11 +size 131677858 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fa18ed94878d4c35f31ca20c3f000ccba5327327 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5e64035f54479e17931786c851372d11c2395ef9929956d150acaf86d81e064 +size 131677847 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..68d99b16393fb67bc36f98bceca134579e07799e --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:293cb364fae08443ca4ac4ab0b3c8d548c377b2fd4cbbab05e2871f31990d6f5 +size 131677666 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0cac7d0a27f015fbc7b65d57c7cd06faaa989c7b --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9624c0063530af043fa94ddafb22776381caf3b73fa1c5f66ba9dfce04b7760b +size 131677794 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..558e838a8fe2acfc69c7e80d54c8fe96e55a0b40 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c45ae093525d3a693cc657ff99955136da9ed133afa12cb4f8a84b23def91dcc +size 131677794 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7c18de6ba717a1e6c36045ef00c929997e072ee9 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8bbd52d1b80eed02da90a5ec726740fd4c8db717577e52f8fb51d55231c49095 +size 131677794 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3395d1412bf8aeb55886aa5c34b1772dcba7be24 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dcdd99901e6b3014727d51624267261075845da609661dc8be95c2cf9cd9aace +size 131677730 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..aa828a5c77f0258ed32ba8a62412a500d3f4ff89 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a76c9c067b5ba56db9281b870be7226622d06045b2f5bc5fa45040f8add6c2a7 +size 131677858 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..484906238ffebc506ab2b8f5a049a3743e24ceef --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:971783a7905221f19f88934cd4186069c9dbae88ac663efbb1fd0d951d9e3ede +size 131677794 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..55bcceaff43005fa61f70dda812a37c324d3df16 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4193ad3d7f2783d2122e902f50f22a3b2cb530fc8c3b4ae181e594234f30f7c6 +size 131677730 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a5f1671d0b9eeb38dca7a068cbe80b0652dfbcf3 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1258e192060f91605d39d7abeda4fd51e7e92b1f5aea48fee538d0932de792a7 +size 131677666 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c6fb6e92a137a88e7f992c6686e9e2c5daabbacd --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ec743549218a45a006654ff5cde409b0b743099eeff6c9d19a30273724c648c +size 131677794 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5cd9550cb6f1d1612c12e78a31e5ff6999ac20b4 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0571235e6eee0533c70537f2b2bbd50c894c6d38062e0b440d54d06983e4b244 +size 131677655 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7a940b62f27357484fd826cee003ea3fc4161896 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:26de51fe5e5befc738876d2363dc5015070faad6493167ec564f8605d96e93d1 +size 131677730 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..28d00faac06c62381c8aed4df9081928b7af77c0 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22172e520cefe2c97072cbdbb61e1d64c4e8d8876ea9bc81885366b57067d946 +size 131677730 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7066ac6edd647e4263ad1e4a70a63f52ca719d1b --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb0fddafc4a9c8830aba16e6c1fa0c272a7e84b607b2776ffb512d03ad68a147 +size 131677730 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c3a6e74b2cd332d711766d873b8f0abd31e4b163 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7322aa8f36b1061faf2b6cfc350ffffe490376933c2c4aed521943078600ac8a +size 131677730 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..16edc349787c8d710d437482df275f4a86bd7ce8 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac0a42d6351d06f7b0bd94420b915ff4ac6ea9b7a5e70c77fcca36fee0497690 +size 131677730 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cc628929ed52e107c36d2a0b93ef799e173dcf2a --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:689437fd384606b08be60112dd8b2d126da0a385cb0ca35c5c0d25faf1b4b898 +size 131677730 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..923aa03edda76b5e91e43ae0da30f249eaf78c44 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:38741805226a8870e5e5af447376718b42aa167b6a11b33d9739cf1d6c9f273a +size 131677730 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1e29a2ad456c48cb552f541f3ac7495abd74fb9d --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d82752395cdc3264faa565ed88a14457995356f83fe8afc2fb6665c21e9faab +size 131677794 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c258a2a6ee1d53403ac7f99f524c95d4dbf5bef9 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:983753596ad2304629c856692a86220eab881c1418e2ee8f3ba4456b3018629e +size 131677858 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dcebe9635cf77a5d9a24b40f847d81eeeade5f91 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf08f43c6368d27be105b4c01e085889bfd21c7b00ddd865219591c0df1f2aea +size 131677730 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..da78294f684174101d7104dc52bbd00f68b7811c --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ebf4833629fbc32ddba1dc03f07a69c2c375768c94aa230c07a87654ca583db3 +size 131677719 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1312ce90c667b50c81d5a66e00e3f1f5e2b58e65 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:080abd974e8c4693ffcdb97f4b68c304f721ecf81759badefdfd43208bbbcee6 +size 131677858 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8dcf58d65f6dba5eb2923da807efe690557b983a --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:977fe5e21a08e75021efba357c8d92f5231524c5c8bba9a0e1db9e7cbaea5dae +size 131677730 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..59ceafdebe47f67c131c6022ba572324be8cd314 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9d0b3e78fdca60b892521e8d4898dd3ea16c9306dd09c889a48936f8b33adfe +size 131677730 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e0f2ca7269effdf272c73bc0e7cf77681084151f --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b14a403c27e1db99615e78e0e64ca11de3fdb5b6953c562a932c8d747f6a5a4 +size 131677666 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4a07d7daeb3eb89b5be0284d27822ec15d1ee50e --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:21fe0d4febfe8688dd447db04406ab26238c0f55d9045b007ca53bb223565318 +size 131677794 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2bb924f3b35bca48aa02b5ada520e3dcf4390f0d --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e09bdc87eb191e762146504a11c4548c902b56b2c4413219c175759369ded2ef +size 131677666 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0c63bda9767e26e56312f019822b7bcbb373cf32 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:762bdf812e2a3adae556dd83c566871ab5fb0105d23dc19c9b10ab5f66318d75 +size 131677730 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..383a94a66282f9c6d6abadd7a9c1de8ca2356bf5 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ca825f6d4f6e0435b885ee8a3de44ffc2afe15f87fe8edcc34199de58a74225 +size 131677730 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..87d6e9ebe6ea0b45e3307447e87df9761620c0f4 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f17d74f058c3ad22991bc6e674286fd7a96c425bccdc56b877c4293d64cab1f +size 131677858 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b5cb388a420245c4874afe68a7f72773b1a60bdd --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:44fec42cfc5a2131dc889fa7cc1351ce3f154e0f92ce7109068210b27d7b1cf7 +size 131677794 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d014da27da1c41135d0a77ccd45e1dd12a42a8f4 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db90c9211a2dbb9682f5eb96197432502af864bef0bae46387c17cd1a65295f4 +size 131677719 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c63bc22a153e29d7a558e85e94e8d0e9e3595807 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e975fb47479e4416ebe915a0bc84065e2ade7f541c4b541aded9e7eb3453426 +size 131677666 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..aed4334639f49699a792f4102d3c1bf68841156a --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02ee63cbd631a425ed910bc19d17a6e8126f376b244282c53c80429372aecedd +size 131677730 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e7faa24bce63e07f59ffa1d8d5c7f9454d18a1aa --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b3ca677279e87a7cd4792f2be72d8c67a9faba214e98fdecda09cab4787cb18 +size 131677858 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..450447e567deaeeb4a203129d05a51bc9839b501 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e5d7685b4b907dfca49eeac3ca3f528723f5d029470e65efeb12be103283c641 +size 131677794 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6b5b820982f71f0f2770a1cce546871c6e9a2ffc --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c419e6db2d60438c7c7ec5e9bdcc891bf3253d1a908a582f47adc635b240e70c +size 131677730 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4995bb3b49b0fb0ca8537d20bae5c4f14de5c52e --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e5f425ac835303ffb1ea5681acf653dbbc65409d2812616423c6a61eabf40bd +size 131677794 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7f4f62518aac21cd6c412bd7ab3e3e1ad60a7eaa --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a4d0ed010b480988f2d99dae37a472a7f96577ddaf5abdbfaf86990438052ac +size 131677730 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5e572764a5dd8d72859a564640604159078b1b9f --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fae575fe230ae1b5541c0da150154598771fcbe0afea4677a9bc5a33c0001bb2 +size 131677730 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..06eb4da32eaa5d076ba077c477ebf8e2dafa25bf --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b729f36fe816328f6c7d8bdb7489b57b03b008ad71745238b62d93fd23d8fe3a +size 131677730 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..df73c45b8814a15d81c8b2a1a082c6fa34dd4da3 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2cc03f200e4e4cab97f4e0eeb41dcf1ec30ae0f31fb10b2c398a196f2dadcac9 +size 131677730 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..be70efc8c4c2a0c27b6194f6128d2b2285fc0a22 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ce4591b5e1d8f749dbcd173f51629e7c12d9a8cd81fbdffc0655312ed82f315 +size 131677847 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2c0fd906cacdc0924015e6eb07f110649250eee3 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f156ddd3d2f828255ecde8e3bb7db52da634d917c93650aa1e2842f22ca6a6f +size 131677666 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..68e0a5e7f457303af6f06276adbdf7491977f882 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:37ee576231ff6bc89ca113ff6ae19c2ce6994308e657baefd5ceedc7612a7c75 +size 131677730 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5070d8aac492d55a999b90f577e214faf5e25036 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e0ad8180c832dd3b6833431311038f2cdef147ca94c49052febbdf25b36013de +size 131677730 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5e6d165cbbf3ae2499238f15afddfc518c079c89 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb0391fb5a4cbcce2f163fa775a1d51debce14a92fe3fa32baf17a58dde16381 +size 131677922 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fa82b5727686b2aa3371db326ee4496bab3c148f --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:88d357c63adf722fd5bf5507d9062d72945766755fdf371b49c6e51144327ff3 +size 131677730 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7d698377f9e93483880c99d2c31b22e1372d0118 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b53283f31ec32149080ced91548e466de9b124cacb15b3dc7d69ab0f300ed35 +size 131677666 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b325ce6dddb69061a94641a7464db85440ef647c --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c37c646737de93449fae6b00429790b289d72c5f0220d4b16c5304c2d241b290 +size 131677794 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5a58604a1c718ba39bc53ea8a9b1189f330802a9 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df29123eb60971fbf8376f590ec68be4c8ba056bd8c552ad50a508338f4aca8b +size 131677794 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..aee7a0f241cbd362e06593bd631433b1cae3239e --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca2d7e0ef43e8c6949b17bd2430673c821dda2765c267a968778e5012a6e050e +size 131677858 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7ae5770a5dd972a713f28c300f6a74a70e48ff73 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8e67ca874803cfed56c62025fe30e40918bdcc98d4d3995373caaa5fdb3df26 +size 131677666 diff --git a/perplexity25/global_step52452/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt b/perplexity25/global_step52452/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1ec2c37349ef473508365fe642a9ed58526f5871 --- /dev/null +++ b/perplexity25/global_step52452/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:160302c220200a0cafb1b7327fa22fff70800afa2c8d962c264d5d3512afeb9b +size 131677719 diff --git a/perplexity25/global_step52452/layer_01-model_00-model_states.pt b/perplexity25/global_step52452/layer_01-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..00e4df32ae8c64288b9cb4f153a11129c9df443a --- /dev/null +++ b/perplexity25/global_step52452/layer_01-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8fafd1f9bffe1c8d1c8392f038279b0388dbfa8a46cd4b86b76bb0a4455e8fb9 +size 268043523 diff --git a/perplexity25/global_step52452/layer_03-model_00-model_states.pt b/perplexity25/global_step52452/layer_03-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8bfad1ea6767ff3802c7c4e1b1421d8d85825436 --- /dev/null +++ b/perplexity25/global_step52452/layer_03-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97c3818edbb2af4d773a550c11e406e2091768012b8a035a55c90411d80823ea +size 157357315 diff --git a/perplexity25/global_step52452/layer_04-model_00-model_states.pt b/perplexity25/global_step52452/layer_04-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9820459cca13c3f062d6f4e427a67bed06f5e55f --- /dev/null +++ b/perplexity25/global_step52452/layer_04-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:021664eb72161a5c2465087c8cd14d95f103924cd9de5a8e0f248e05847861d2 +size 157357315 diff --git a/perplexity25/global_step52452/layer_05-model_00-model_states.pt b/perplexity25/global_step52452/layer_05-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9a3f9f07acac63fc20ae5630cac67394b636f66b --- /dev/null +++ b/perplexity25/global_step52452/layer_05-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b213c74316d614eaf8f609d581db3d72d391de072e86f2c988d718125de9887c +size 157357315 diff --git a/perplexity25/global_step52452/layer_06-model_00-model_states.pt b/perplexity25/global_step52452/layer_06-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ce74ad54bafca971ebef400dc392abb4a23ded9f --- /dev/null +++ b/perplexity25/global_step52452/layer_06-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:143a1a408ddd7d35b99173ce609cd4ad89521a18ce79a37581a2823d04300a29 +size 157357315 diff --git a/perplexity25/global_step52452/layer_07-model_00-model_states.pt b/perplexity25/global_step52452/layer_07-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..aba31b8f0974b0cadb7840eb3449ea1c56e7a5c7 --- /dev/null +++ b/perplexity25/global_step52452/layer_07-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46212cc214fda2f2da28726718f929c2bc6c1e554894e5068fbd5c844c08b0f0 +size 157357315 diff --git a/perplexity25/global_step52452/layer_08-model_00-model_states.pt b/perplexity25/global_step52452/layer_08-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f92c4c716d0e9f3ff102f2ac4db40b696800f186 --- /dev/null +++ b/perplexity25/global_step52452/layer_08-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d68acaf6a7e50cb47b15c8672a56a6439dc7448f97db9c4aec52b05f60db6d0 +size 157357315 diff --git a/perplexity25/global_step52452/layer_09-model_00-model_states.pt b/perplexity25/global_step52452/layer_09-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dd68178150552fb3cd3ec196638a028082834092 --- /dev/null +++ b/perplexity25/global_step52452/layer_09-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe32d41a3d4440c5c8aeac3804f06428f8e5dbc5755f3c1bd6e60647c679c1ab +size 157357315 diff --git a/perplexity25/global_step52452/layer_10-model_00-model_states.pt b/perplexity25/global_step52452/layer_10-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..11aa50040c73a8279475a7f3a9c94b5617e06ae9 --- /dev/null +++ b/perplexity25/global_step52452/layer_10-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e5359e373d7471f6871751cba105b6df5266bbd6226513aa1cf2b84dd750bc2 +size 157357315 diff --git a/perplexity25/global_step52452/layer_11-model_00-model_states.pt b/perplexity25/global_step52452/layer_11-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..93fa17838b61ae6e96508bbad76a2ef3f6e34a91 --- /dev/null +++ b/perplexity25/global_step52452/layer_11-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5cdb08e33ec652ef182da3643220dd036f34a9873e52bde3d6058458fddecf8e +size 157357315 diff --git a/perplexity25/global_step52452/layer_12-model_00-model_states.pt b/perplexity25/global_step52452/layer_12-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1190586bd94945edf0707e61ad92ac92d3c34dee --- /dev/null +++ b/perplexity25/global_step52452/layer_12-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f1788c954521aa0006e2fd9ab17649488aae27b6d0b72fcc6634f7518fbb2e4 +size 157357315 diff --git a/perplexity25/global_step52452/layer_13-model_00-model_states.pt b/perplexity25/global_step52452/layer_13-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4278e2da78a88bcda81f1681584b1b1f5e89a848 --- /dev/null +++ b/perplexity25/global_step52452/layer_13-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:819b454c61c3cc61f4f16efcf39eaefbc6cea467510424c873767dc2616a4362 +size 157357315 diff --git a/perplexity25/global_step52452/layer_14-model_00-model_states.pt b/perplexity25/global_step52452/layer_14-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..84d90cc6b10203e7fcb78e505aede3d2a1f3f250 --- /dev/null +++ b/perplexity25/global_step52452/layer_14-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6ec62525ed65c875a2932c961f4e6e5e9293f9b6b91869e174ced7195476476 +size 157357315 diff --git a/perplexity25/global_step52452/layer_15-model_00-model_states.pt b/perplexity25/global_step52452/layer_15-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..166b84ab1e79bb08ee33812f952844eefcc5a797 --- /dev/null +++ b/perplexity25/global_step52452/layer_15-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:faa9a6c07ed834b9b61a2e4db8569867c301d1f72b327b53448495179f3e5cdf +size 157357315 diff --git a/perplexity25/global_step52452/layer_16-model_00-model_states.pt b/perplexity25/global_step52452/layer_16-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0ee7821685d16c1f41cd8e7dc6abcb2b347d46a2 --- /dev/null +++ b/perplexity25/global_step52452/layer_16-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:022c4856595eaf99d56adb970930a443b7f666a8464e4d2f657fd29bb600b22d +size 157357315 diff --git a/perplexity25/global_step52452/layer_17-model_00-model_states.pt b/perplexity25/global_step52452/layer_17-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..89c6fca2522a6221ae9b6e88a4bb4cfeaf132e9a --- /dev/null +++ b/perplexity25/global_step52452/layer_17-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:062774767bfe58d8494b989d60d36fa8bce5abb983390c241ef9130d1cab795e +size 157357315 diff --git a/perplexity25/global_step52452/layer_18-model_00-model_states.pt b/perplexity25/global_step52452/layer_18-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4cb7bc04963de15d2bfdf4df978c61bdb117f672 --- /dev/null +++ b/perplexity25/global_step52452/layer_18-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58bea371e80915a1d772ea02aa9046b7cc6bbfecf396b13727213d6bfabe28b1 +size 157357315 diff --git a/perplexity25/global_step52452/layer_19-model_00-model_states.pt b/perplexity25/global_step52452/layer_19-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..abf3d3c355d68c65c85cc50ce65418cbfabf9d16 --- /dev/null +++ b/perplexity25/global_step52452/layer_19-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06f7385470489b1bf9868796b3942f6c85d91cf9288d02e5e997d55b273b7925 +size 157357315 diff --git a/perplexity25/global_step52452/layer_20-model_00-model_states.pt b/perplexity25/global_step52452/layer_20-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..648f16829953cf9ca8a565db05739752418a671a --- /dev/null +++ b/perplexity25/global_step52452/layer_20-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a4a24f3498b3f77d74c42f2a49b8bc0e71bed047c01c1a437a7a4f23bc9665e6 +size 157357315 diff --git a/perplexity25/global_step52452/layer_21-model_00-model_states.pt b/perplexity25/global_step52452/layer_21-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8955b9399b83c861bc297a558f5ecabdcb9bdb5c --- /dev/null +++ b/perplexity25/global_step52452/layer_21-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a2cc411208bdebac4e4dc6319389c368619ddb2bad69d1e8edefee44792d5e6 +size 157357315 diff --git a/perplexity25/global_step52452/layer_22-model_00-model_states.pt b/perplexity25/global_step52452/layer_22-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c25e1b931779969282e86dfd0b6353567982cc6b --- /dev/null +++ b/perplexity25/global_step52452/layer_22-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d7e5861789a11672cb7d369ff8713129de9704d63f2d9bd0daf12786dc22706 +size 157357315 diff --git a/perplexity25/global_step52452/layer_23-model_00-model_states.pt b/perplexity25/global_step52452/layer_23-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..20bdb7e2d259afa2ea8290536b54138b1e019e91 --- /dev/null +++ b/perplexity25/global_step52452/layer_23-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c92bbccfa829b04e80e67c3cb95a9663945655bd4911678bc1eb24745e978e2a +size 157357315 diff --git a/perplexity25/global_step52452/layer_24-model_00-model_states.pt b/perplexity25/global_step52452/layer_24-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..29a2770aac063951c7949430fdc3911df26035be --- /dev/null +++ b/perplexity25/global_step52452/layer_24-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8199b8a19b3b17dbc0ae1ddc0703969561bb6bdb3a921409435c84a1be03bba +size 157357315 diff --git a/perplexity25/global_step52452/layer_25-model_00-model_states.pt b/perplexity25/global_step52452/layer_25-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5900fdfc5de07ce712ad5ef4124188dbac66e882 --- /dev/null +++ b/perplexity25/global_step52452/layer_25-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4345f8b951fdfe2828b49b7327dcafab759be6d01a8c21e9cd2a512ebdafb7a5 +size 157357315 diff --git a/perplexity25/global_step52452/layer_26-model_00-model_states.pt b/perplexity25/global_step52452/layer_26-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5e1edc2a0b3e928298e479a90056aff677e64763 --- /dev/null +++ b/perplexity25/global_step52452/layer_26-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bed9afe1c4b4a5843a81dd8cf2216fa6303012db52f981afd9e39b495225eef6 +size 157357315 diff --git a/perplexity25/global_step52452/layer_27-model_00-model_states.pt b/perplexity25/global_step52452/layer_27-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c27e79098f8ab585c4a2f9b639bf14a93063b2af --- /dev/null +++ b/perplexity25/global_step52452/layer_27-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc93bd898381a63f544ab36314c86dc8658ea45f6f331f7e592635f76863a22d +size 157357315 diff --git a/perplexity25/global_step52452/layer_28-model_00-model_states.pt b/perplexity25/global_step52452/layer_28-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4df3cc9a21f1b4c7363a4f2c8d160372a1f43f40 --- /dev/null +++ b/perplexity25/global_step52452/layer_28-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8459ad9506acab48923110a321119f47d949c91c6494844df5de074ef57a767d +size 157357315 diff --git a/perplexity25/global_step52452/layer_29-model_00-model_states.pt b/perplexity25/global_step52452/layer_29-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..50faebf684b5bf60f0a7ac8aabb0384817e7d247 --- /dev/null +++ b/perplexity25/global_step52452/layer_29-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:033627f2201452b67bb8bf82ea39c583a72b526665b9ea657cad1390dfa102e1 +size 157357315 diff --git a/perplexity25/global_step52452/layer_30-model_00-model_states.pt b/perplexity25/global_step52452/layer_30-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6e04e76a17ce662118eac48b1ef871b1b05de416 --- /dev/null +++ b/perplexity25/global_step52452/layer_30-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0533f1c755a3b98550b33b906960fdcbd2fc60ea818b682aa40daa2f93bdf3d9 +size 157357315 diff --git a/perplexity25/global_step52452/layer_31-model_00-model_states.pt b/perplexity25/global_step52452/layer_31-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7d3c201adfe27447e348ee645376e4500ed9ac01 --- /dev/null +++ b/perplexity25/global_step52452/layer_31-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e3286956f7c85df318ed38f2facab805942861d03feaeb065b49c0b46d3848f +size 157357315 diff --git a/perplexity25/global_step52452/layer_32-model_00-model_states.pt b/perplexity25/global_step52452/layer_32-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2e72777fb94410246d8acb5a62f66a01d616e442 --- /dev/null +++ b/perplexity25/global_step52452/layer_32-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:17d0eb38ee859ac92e44e082a7ababca36e3dbd32c08e71aa396596348539cfa +size 157357315 diff --git a/perplexity25/global_step52452/layer_33-model_00-model_states.pt b/perplexity25/global_step52452/layer_33-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0f1172efb4cbfd7707a32bf8074272c0335fbb48 --- /dev/null +++ b/perplexity25/global_step52452/layer_33-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c3b3efad498b831c4e33f311ff4986f929fdaef16337edf6c7a128fa50ebacd +size 157357315 diff --git a/perplexity25/global_step52452/layer_34-model_00-model_states.pt b/perplexity25/global_step52452/layer_34-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f3aadc62eaed866f5e4bae9cab86d80fdd63e6d3 --- /dev/null +++ b/perplexity25/global_step52452/layer_34-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ae8e2d2c329468f562e3f6104b404ef8c5b1f6873c19110bd02df90284edbeb +size 157357315 diff --git a/perplexity25/global_step52452/layer_35-model_00-model_states.pt b/perplexity25/global_step52452/layer_35-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e7b2767befceee71932e820f04bc342598adccdf --- /dev/null +++ b/perplexity25/global_step52452/layer_35-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ff5625a26f58160bfa2de2de6fbf261c821841b0b0ecf76c547104e269776df +size 157357315 diff --git a/perplexity25/global_step52452/layer_36-model_00-model_states.pt b/perplexity25/global_step52452/layer_36-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..753e904debbdb50ba08801c89828fbb09cf6a37c --- /dev/null +++ b/perplexity25/global_step52452/layer_36-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c44c9e8bab6e656cf079f7773e994387cf7265d7c52e9f471ee5886193c6d088 +size 157357315 diff --git a/perplexity25/global_step52452/layer_38-model_00-model_states.pt b/perplexity25/global_step52452/layer_38-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..45c06d98d070ef0f39711c50457e2ccb1fb75a8e --- /dev/null +++ b/perplexity25/global_step52452/layer_38-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:925e4f99b6dddc285e636cc194f88bbeb65f625ce01159f98b97e955aacd7198 +size 11459 diff --git a/perplexity25/global_step52452/mp_rank_00_model_states.pt b/perplexity25/global_step52452/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a79dd914133ad73f5622349dcbb1d193b57abcf6 --- /dev/null +++ b/perplexity25/global_step52452/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd79fc3c77bc38f6c9342abc1851fd58f57216225051dd7e0bc3ad10de0b7ffd +size 49971 diff --git a/perplexity25/sbatch_2b855boscarperplexity25.sh b/perplexity25/sbatch_2b855boscarperplexity25.sh new file mode 100644 index 0000000000000000000000000000000000000000..868b2c868e5de24bea7457af2f0002e2ae3f5605 --- /dev/null +++ b/perplexity25/sbatch_2b855boscarperplexity25.sh @@ -0,0 +1,165 @@ +#!/bin/bash +#SBATCH --exclude=nid007571,nid007112,nid006774,nid007502,nid007506,nid007507,nid005145,nid006692,nid007218,nid007123,nid006124,nid006123,nid007496,nid007237,nid006852,nid007206,nid006947,nid007212,nid006977,nid007222,nid005444,nid007219,nid007493,nid007221,nid005300,nid005619,nid006118,nid005203,nid006113,nid006481,nid007077,nid005208,nid005207,nid005879,nid005901 +#SBATCH --nodes=32 +#SBATCH --ntasks-per-node=1 +#SBATCH --cpus-per-task=32 +#SBATCH --mem=256G +#SBATCH -p standard-g +#SBATCH -t 48:00:00 +#SBATCH --gpus-per-node=mi250:8 +#SBATCH --exclusive=user +#SBATCH --hint=nomultithread +#SBATCH --account=project_462000119 +#SBATCH -o logs/%j.out +#SBATCH -e logs/%j.err + +VARIANT=2b855b55boscarperplexity25 + +# if run without sbatch, invoke here +if [ -z $SLURM_JOB_ID ]; then + mkdir -p logs + sbatch "$0" + exit +fi + +set -euo pipefail + +# symlink logs/latest.out and logs/latest.err +ln -f -s $SLURM_JOB_ID.out logs/latest.out +ln -f -s $SLURM_JOB_ID.err logs/latest.err + +KILL_SWITCH_PATH=kill-switch-$VARIANT +CHECKPOINT_PATH=checkpoints_$VARIANT +TENSORBOARD_PATH=tensorboard_$VARIANT + +# Data +VOCAB_FILE="gpt2/vocab.json" +MERGE_FILE="gpt2/merges.txt" +#TRAIN_DATA_PATH="/scratch/project_462000119/data/c4_subsampled/gpt2tok_c4_en_10B_text_document" +#VAL_DATA_PATH="/scratch/project_462000119/data/c4_validation/gpt2tok_c4validation_rerun_text_document" + +TRAIN_DATA_PATH=trainoscarperplexity25.txt +# "train: 1.0 0:1 /scratch/project_462000119/data/c4_subsampled/gpt2tok_c4_en_55B_text_document" +VALID_DATA_PATH=val.txt +# "validation: 1.0 0:1 /scratch/project_462000119/data/c4_validation/gpt2tok_c4validation_rerun_text_document" + +PP_SIZE=1 +TP_SIZE=1 + +MICRO_BATCH_SIZE=2 +GRADIENT_ACCUMULATION_STEPS=1 +WORLD_SIZE=$((SLURM_GPUS_ON_NODE*SLURM_JOB_NUM_NODES)) +GLOBAL_BATCH_SIZE=$((MICRO_BATCH_SIZE*WORLD_SIZE*GRADIENT_ACCUMULATION_STEPS)) + +# Model parameters +source model_params.sh +MODEL_PARAM=("${PARAM_2980M[@]}") +NHIDDEN=${MODEL_PARAM[0]} +FFN_HIDDEN_SIZE=${MODEL_PARAM[1]} +KV_SIZE=${MODEL_PARAM[2]} +NHEADS=${MODEL_PARAM[3]} +NLAYERS=${MODEL_PARAM[4]} +SEQ_LEN=2048 + +echo "Model parameters: d_model $NHIDDEN ffw_size $FFN_HIDDEN_SIZE kv_size $KV_SIZE n_heads $NHEADS n_layers $NLAYERS" + +SAVE_INTERVAL=10000 + +# Tokens: 55000000000 +# -> Samples: 26855469 +TRAIN_SAMPLES=26_855_469 + +OPTIMIZER_ARGS=" \ + --optimizer adam \ + --adam-beta1 0.9 \ + --adam-beta2 0.95 \ + --adam-eps 1e-8 \ + --lr 2e-4 \ + --min-lr 2e-5 \ + --lr-decay-style cosine \ + --lr-decay-samples $TRAIN_SAMPLES \ + --lr-warmup-samples 268_555 \ + --clip-grad 1.0 \ + --weight-decay 1e-1 \ + " + +GPT_ARGS=" \ + --num-layers $NLAYERS \ + --hidden-size $NHIDDEN \ + --num-attention-heads $NHEADS \ + --kv-channels $KV_SIZE \ + --ffn-hidden-size $FFN_HIDDEN_SIZE \ + --seq-length $SEQ_LEN \ + --max-position-embeddings $SEQ_LEN \ + --micro-batch-size $MICRO_BATCH_SIZE \ + --global-batch-size $GLOBAL_BATCH_SIZE \ + --train-samples $TRAIN_SAMPLES \ + --vocab-file $VOCAB_FILE \ + --merge-file $MERGE_FILE \ + --clip-grad 1.0 \ + --kill-switch-path $KILL_SWITCH_PATH \ + --bf16 \ + $OPTIMIZER_ARGS \ + " + +OUTPUT_ARGS=" \ + --log-interval 10 \ + --save-interval $SAVE_INTERVAL \ + --eval-interval 100 \ + --eval-iters 100 \ + --tensorboard-dir $TENSORBOARD_PATH \ + --tensorboard-queue-size 5 \ + --log-timers-to-tensorboard \ + --log-batch-size-to-tensorboard \ + --log-validation-ppl-to-tensorboard \ + " + +ZERO_STAGE=0 + +mkdir -p ds_configs +DS_CONFIG_PATH="ds_configs/$SLURM_JOB_ID.json" + +cat < $DS_CONFIG_PATH +{ + "train_micro_batch_size_per_gpu": $MICRO_BATCH_SIZE, + "train_batch_size": $GLOBAL_BATCH_SIZE, + "gradient_clipping": 1.0, + "zero_optimization": { + "stage": $ZERO_STAGE + }, + "bf16": { + "enabled": true + }, + "steps_per_print": 2000, + "wall_clock_breakdown": false +} +EOF + +DEEPSPEED_ARGS=" \ + --deepspeed \ + --deepspeed_config $DS_CONFIG_PATH \ + --zero-stage $ZERO_STAGE \ + " + +CMD=" \ + Megatron-DeepSpeed/pretrain_gpt.py \ + --tensor-model-parallel-size $TP_SIZE \ + --pipeline-model-parallel-size $PP_SIZE \ + $GPT_ARGS \ + $OUTPUT_ARGS \ + --save $CHECKPOINT_PATH \ + --load $CHECKPOINT_PATH \ + --train-weighted-split-paths-path $TRAIN_DATA_PATH \ + --valid-weighted-split-paths-path $VALID_DATA_PATH \ + --data-impl mmap \ + $DEEPSPEED_ARGS \ + " + +echo $CMD + +echo "START $SLURM_JOBID: $(date)" + +# bash launch_srun.sh $CMD +srun --label launch.sh $CMD + +echo "END $SLURM_JOBID: $(date)" diff --git a/perplexity25/tensorboard_2b855b55boscarperplexity25/events.out.tfevents.1683717416.nid007109.105173.0 b/perplexity25/tensorboard_2b855b55boscarperplexity25/events.out.tfevents.1683717416.nid007109.105173.0 new file mode 100644 index 0000000000000000000000000000000000000000..71797ebc058731b69e123e787eee426e80ce01c3 --- /dev/null +++ b/perplexity25/tensorboard_2b855b55boscarperplexity25/events.out.tfevents.1683717416.nid007109.105173.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4875fe45e1ca17c473d772eb2d2bf734cd0709e4362b28d154222dc3cbdc424b +size 94423975 diff --git a/perplexity25/trainoscarperplexity25.txt b/perplexity25/trainoscarperplexity25.txt new file mode 100644 index 0000000000000000000000000000000000000000..274d8f0370a5e92b5a9c6cdc011980c68c6d7411 --- /dev/null +++ b/perplexity25/trainoscarperplexity25.txt @@ -0,0 +1 @@ +"train: 1.0 0:1 /scratch/project_462000119/data/oscarperplexity/gpt2tok_oscar_en_perplexity_25_text_document" diff --git a/perplexity25/transformers/config.json b/perplexity25/transformers/config.json new file mode 100644 index 0000000000000000000000000000000000000000..2debb3b510ba26c4e6693cd4c6be848955e93cec --- /dev/null +++ b/perplexity25/transformers/config.json @@ -0,0 +1 @@ +{"vocab_size": 50304, "n_positions": 2048, "n_embd": 2560, "n_layer": 34, "n_head": 20, "n_inner": 10240, "activation_function": "gelu", "resid_pdrop": 0.1, "embd_pdrop": 0.1, "attn_pdrop": 0.1, "layer_norm_epsilon": 1e-05, "initializer_range": 0.02, "summary_type": "cls_index", "summary_use_proj": true, "summary_activation": null, "summary_first_dropout": 0.1, "summary_proj_to_labels": true, "scale_attn_weights": true, "use_cache": true, "scale_attn_by_inverse_layer_idx": false, "reorder_and_upcast_attn": false, "bos_token_id": 50256, "eos_token_id": 50256, "return_dict": true, "output_hidden_states": false, "output_attentions": false, "torchscript": false, "torch_dtype": null, "use_bfloat16": false, "tf_legacy_loss": false, "pruned_heads": {}, "tie_word_embeddings": true, "is_encoder_decoder": false, "is_decoder": false, "cross_attention_hidden_size": null, "add_cross_attention": false, "tie_encoder_decoder": false, "max_length": 20, "min_length": 0, "do_sample": false, "early_stopping": false, "num_beams": 1, "num_beam_groups": 1, "diversity_penalty": 0.0, "temperature": 1.0, "top_k": 50, "top_p": 1.0, "typical_p": 1.0, "repetition_penalty": 1.0, "length_penalty": 1.0, "no_repeat_ngram_size": 0, "encoder_no_repeat_ngram_size": 0, "bad_words_ids": null, "num_return_sequences": 1, "chunk_size_feed_forward": 0, "output_scores": false, "return_dict_in_generate": false, "forced_bos_token_id": null, "forced_eos_token_id": null, "remove_invalid_values": false, "exponential_decay_length_penalty": null, "suppress_tokens": null, "begin_suppress_tokens": null, "architectures": ["GPT2LMHeadModel"], "finetuning_task": null, "id2label": {"0": "LABEL_0", "1": "LABEL_1"}, "label2id": {"LABEL_0": 0, "LABEL_1": 1}, "tokenizer_class": null, "prefix": null, "pad_token_id": null, "sep_token_id": null, "decoder_start_token_id": null, "task_specific_params": null, "problem_type": null, "_name_or_path": "", "transformers_version": "4.25.0.dev0", "n_ctx": 1024, "gradient_checkpointing": false, "model_type": "gpt2"} \ No newline at end of file diff --git a/perplexity25/transformers/pytorch_model.bin b/perplexity25/transformers/pytorch_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..0ed2ffb4057585319156fa522f074375500db411 --- /dev/null +++ b/perplexity25/transformers/pytorch_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e3e042583fb08bc7748c6a49f849f0ba96013c55a2d77546bfe6fe9099b25d2 +size 5903417421