diff --git a/.gitattributes b/.gitattributes index edb80580c59786d0fe658455851d7f2857fc384e..f9bfe618530cb74d2b37f0250be666ec6bdb6ea2 100644 --- a/.gitattributes +++ b/.gitattributes @@ -2646,3 +2646,51 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text 4b284b84boscarv2/evaluation/generation/examples.4b284b84boscarv2_GEM-wiki_lingua_en_tldr_en_1.jsonl filter=lfs diff=lfs merge=lfs -text 4b284b84boscarv2/evaluation/generation/examples.4b284b84boscarv2_GEM-wiki_lingua_en_tldr_en_2.jsonl filter=lfs diff=lfs merge=lfs -text 4b284b84boscarv2/evaluation/generation/examples.4b284b84boscarv2_GEM-wiki_lingua_en_tldr_en_3.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9oscar/evaluation/generation/examples.4b284b1b9oscar_gem_xsum_article_DOC_summary_1.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6boscar/evaluation/generation/examples.4b284b6boscar_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6boscar/evaluation/generation/examples.4b284b6boscar_GEM-wiki_lingua_en_tldr_en_0.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6boscar/evaluation/generation/examples.4b284b6boscar_GEM-wiki_lingua_en_tldr_en_1.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9oscar/evaluation/generation/examples.4b284b1b9oscar_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9oscar/evaluation/generation/examples.4b284b1b9oscar_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9oscar/evaluation/generation/examples.4b284b1b9oscar_GEM-web_nlg_en_PALM_prompt_0.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6boscar/evaluation/generation/examples.4b284b6boscar_GEM-web_nlg_en_PALM_prompt_1.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6boscar/evaluation/generation/examples.4b284b6boscar_GEM-wiki_lingua_en_tldr_en_2.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6boscar/evaluation/generation/examples.4b284b6boscar_GEM-wiki_lingua_en_tldr_en_5.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6boscar/evaluation/generation/examples.4b284b6boscar_gem_xsum_article_DOC_summary_0.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9oscar/evaluation/generation/examples.4b284b1b9oscar_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9oscar/evaluation/generation/examples.4b284b1b9oscar_GEM-web_nlg_en_PALM_prompt_2.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9oscar/evaluation/generation/examples.4b284b1b9oscar_GEM-wiki_lingua_en_tldr_en_0.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9oscar/evaluation/generation/examples.4b284b1b9oscar_gem_xsum_article_DOC_summary_0.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9oscar/evaluation/generation/examples.4b284b1b9oscar_gem_xsum_article_DOC_summary_2.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6boscar/evaluation/generation/examples.4b284b6boscar_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6boscar/evaluation/generation/examples.4b284b6boscar_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6boscar/evaluation/generation/examples.4b284b6boscar_GEM-web_nlg_en_PALM_prompt_4.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9oscar/evaluation/generation/examples.4b284b1b9oscar_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6boscar/evaluation/generation/examples.4b284b6boscar_gem_xsum_article_DOC_summary_1.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6boscar/evaluation/generation/examples.4b284b6boscar_GEM-web_nlg_en_PALM_prompt_0.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6boscar/evaluation/generation/examples.4b284b6boscar_gem_xsum_article_DOC_summary_4.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9oscar/evaluation/generation/examples.4b284b1b9oscar_GEM-web_nlg_en_PALM_prompt_1.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9oscar/evaluation/generation/examples.4b284b1b9oscar_GEM-wiki_lingua_en_tldr_en_5.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9oscar/evaluation/generation/examples.4b284b1b9oscar_gem_xsum_article_DOC_summary_4.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6boscar/evaluation/generation/examples.4b284b6boscar_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6boscar/evaluation/generation/examples.4b284b6boscar_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9oscar/evaluation/generation/examples.4b284b1b9oscar_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9oscar/evaluation/generation/examples.4b284b1b9oscar_GEM-web_nlg_en_PALM_prompt_3.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9oscar/evaluation/generation/examples.4b284b1b9oscar_GEM-web_nlg_en_PALM_prompt_4.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9oscar/evaluation/generation/examples.4b284b1b9oscar_gem_xsum_article_DOC_summary_3.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6boscar/evaluation/generation/examples.4b284b6boscar_GEM-wiki_lingua_en_tldr_en_3.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6boscar/evaluation/generation/examples.4b284b6boscar_gem_xsum_article_DOC_summary_5.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9oscar/evaluation/generation/examples.4b284b1b9oscar_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9oscar/evaluation/generation/examples.4b284b1b9oscar_GEM-wiki_lingua_en_tldr_en_3.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9oscar/evaluation/generation/examples.4b284b1b9oscar_gem_xsum_article_DOC_summary_5.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6boscar/evaluation/generation/examples.4b284b6boscar_GEM-web_nlg_en_PALM_prompt_2.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6boscar/evaluation/generation/examples.4b284b6boscar_GEM-web_nlg_en_PALM_prompt_5.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6boscar/evaluation/generation/examples.4b284b6boscar_gem_xsum_article_DOC_summary_2.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6boscar/evaluation/generation/examples.4b284b6boscar_gem_xsum_article_DOC_summary_3.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9oscar/evaluation/generation/examples.4b284b1b9oscar_GEM-web_nlg_en_PALM_prompt_5.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9oscar/evaluation/generation/examples.4b284b1b9oscar_GEM-wiki_lingua_en_tldr_en_2.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9oscar/evaluation/generation/examples.4b284b1b9oscar_GEM-wiki_lingua_en_tldr_en_4.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6boscar/evaluation/generation/examples.4b284b6boscar_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6boscar/evaluation/generation/examples.4b284b6boscar_GEM-web_nlg_en_PALM_prompt_3.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6boscar/evaluation/generation/examples.4b284b6boscar_GEM-wiki_lingua_en_tldr_en_4.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9oscar/evaluation/generation/examples.4b284b1b9oscar_GEM-wiki_lingua_en_tldr_en_1.jsonl filter=lfs diff=lfs merge=lfs -text diff --git a/4b284b1b9oscar/evaluation/generation/agg.4b284b1b9oscar_GEM-web_nlg_en_PALM_prompt_0.json b/4b284b1b9oscar/evaluation/generation/agg.4b284b1b9oscar_GEM-web_nlg_en_PALM_prompt_0.json new file mode 100644 index 0000000000000000000000000000000000000000..e057c09aab9d2f64f9848a1e727503e5688a7703 --- /dev/null +++ b/4b284b1b9oscar/evaluation/generation/agg.4b284b1b9oscar_GEM-web_nlg_en_PALM_prompt_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.3035990566203564, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.025090566187709752}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.071329758776339, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.00279942361165936}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.2777833537640477, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.005021363310584012}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.08651516220636073, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0018421075247631034}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.02493593159722908, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0015907952635559632}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.09479553172438937, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0029506060980076265}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.029457430490114032, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0010438331217221088}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.06175148366384243, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.002527555333736909}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.2437824603111534, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004509160724470269}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.07406437697939146, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0015395345437139562}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.06515539016564718, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0025912111251545702}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.2540442770643496, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.00462671195388165}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.07865092467105374, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0016703135405487922}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-repetitions/4b284b1b9oscar/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9oscar/evaluation/generation/agg.4b284b1b9oscar_GEM-web_nlg_en_PALM_prompt_1.json b/4b284b1b9oscar/evaluation/generation/agg.4b284b1b9oscar_GEM-web_nlg_en_PALM_prompt_1.json new file mode 100644 index 0000000000000000000000000000000000000000..ed674ae05fba576aaef46a37c884d10b8dea8eab --- /dev/null +++ b/4b284b1b9oscar/evaluation/generation/agg.4b284b1b9oscar_GEM-web_nlg_en_PALM_prompt_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.425747629657599, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.019098717536100474}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.07869000641860335, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.002574141434973694}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.27911697917731965, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.005025828797632534}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.09915747457632551, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0020735345455021683}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.028711039922457098, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0015895748345510915}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.1016349747426781, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.003064263260383757}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.03553245669340435, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0012297768666432714}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.06784822137078164, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0023584286957804}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.24104415879973046, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004392721456408033}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.08430815534591073, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.001735358065989058}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.07247904169290792, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.002450321126322307}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.25603235118880574, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004615086249365793}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.09052335683054723, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.00188465696521615}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-repetitions/4b284b1b9oscar/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9oscar/evaluation/generation/agg.4b284b1b9oscar_GEM-web_nlg_en_PALM_prompt_2.json b/4b284b1b9oscar/evaluation/generation/agg.4b284b1b9oscar_GEM-web_nlg_en_PALM_prompt_2.json new file mode 100644 index 0000000000000000000000000000000000000000..22e472a71d49a4912671d7d74164816360d29334 --- /dev/null +++ b/4b284b1b9oscar/evaluation/generation/agg.4b284b1b9oscar_GEM-web_nlg_en_PALM_prompt_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.4497583704772655, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.020681936257570407}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.08676474022374367, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0030356563200589527}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.28565036099040625, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.005160364852348898}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.10711351422120703, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0024517943039154802}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.03205343730461677, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.001723196140481487}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.10665226766319001, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0031321051228955267}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.03910067067467762, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0014210269756776363}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.07292425907812133, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.002682288331233897}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.2418993456910343, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004387413324828132}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.08897314932870945, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.002002929328501285}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.07776458484873876, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.002744825042381609}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.25905556991925294, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004682330002575584}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.09589616680302177, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0021426419270798853}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-repetitions/4b284b1b9oscar/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9oscar/evaluation/generation/agg.4b284b1b9oscar_GEM-web_nlg_en_PALM_prompt_3.json b/4b284b1b9oscar/evaluation/generation/agg.4b284b1b9oscar_GEM-web_nlg_en_PALM_prompt_3.json new file mode 100644 index 0000000000000000000000000000000000000000..824fde23d5dd07425ab50843caa55a0812513c61 --- /dev/null +++ b/4b284b1b9oscar/evaluation/generation/agg.4b284b1b9oscar_GEM-web_nlg_en_PALM_prompt_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.5453566942766312, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.03174339868079995}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.09141520582826082, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0030271528036140147}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.2946460917400917, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.005150457597998139}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.11381502730552777, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0025266791277412273}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.0349533732864018, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0018089338825247128}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.1132672221907378, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0032322633657986535}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.04302598363295129, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0015803110546547487}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.07724838020684321, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0027324213899579644}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.24881404393817505, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004406171113605123}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.09476653245926525, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.002130119160105199}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.0833829754674534, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0028479312887177617}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.26789842816421516, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.00469224168355405}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.10301268965900799, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0022888513790911423}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-repetitions/4b284b1b9oscar/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9oscar/evaluation/generation/agg.4b284b1b9oscar_GEM-web_nlg_en_PALM_prompt_4.json b/4b284b1b9oscar/evaluation/generation/agg.4b284b1b9oscar_GEM-web_nlg_en_PALM_prompt_4.json new file mode 100644 index 0000000000000000000000000000000000000000..ea672fdc06f7969e02bc885f881e95e71f50fd1b --- /dev/null +++ b/4b284b1b9oscar/evaluation/generation/agg.4b284b1b9oscar_GEM-web_nlg_en_PALM_prompt_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.552842738936437, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.031220316118742313}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.0904044344997309, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0028870247747819445}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.30097906504674915, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.005237112327131232}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.1125896095390658, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0024441626752801536}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.03357915742500351, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.001563192087212674}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.1186975703608361, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0033758949815214734}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.042594714406787165, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0014574874865349483}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.07544711584950896, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0025299603142831984}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.2529660247399177, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.00445147947055177}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.09294924226115779, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.00201851881067649}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.08174948336092744, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0026566402566456145}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.2733792203624409, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0047675031230854}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.10127472230162189, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002166709168455675}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-repetitions/4b284b1b9oscar/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9oscar/evaluation/generation/agg.4b284b1b9oscar_GEM-web_nlg_en_PALM_prompt_5.json b/4b284b1b9oscar/evaluation/generation/agg.4b284b1b9oscar_GEM-web_nlg_en_PALM_prompt_5.json new file mode 100644 index 0000000000000000000000000000000000000000..609f789d89ae75f28cbdfa592ca52aed67faaf06 --- /dev/null +++ b/4b284b1b9oscar/evaluation/generation/agg.4b284b1b9oscar_GEM-web_nlg_en_PALM_prompt_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.5160808451457419, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.028152585581808363}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.08756298477917958, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.002702960483622272}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.30943226003927954, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.00537568452081882}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.11267246257206415, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0023161203363087435}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.031279144513968335, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0015413777797901}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.1215282455226915, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.003458287142794445}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.04130600915194189, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0014050088099057468}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.0727149677685351, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.002357535066892359}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.25979581419981984, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004554297207344822}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.09293487391814521, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0018937867038700312}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.07890883384983154, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.002452737865418059}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.28252744959181614, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004927414464655944}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.10164495184500182, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0020419190457151644}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-repetitions/4b284b1b9oscar/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9oscar/evaluation/generation/agg.4b284b1b9oscar_GEM-wiki_lingua_en_tldr_en_0.json b/4b284b1b9oscar/evaluation/generation/agg.4b284b1b9oscar_GEM-wiki_lingua_en_tldr_en_0.json new file mode 100644 index 0000000000000000000000000000000000000000..0c397fc3b9c35ae0a0b9184860ae86dc246f1e21 --- /dev/null +++ b/4b284b1b9oscar/evaluation/generation/agg.4b284b1b9oscar_GEM-wiki_lingua_en_tldr_en_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.15144825263093634, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.001983783278782952}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.22534109695497295, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002481691416374552}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.16612440507868828, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0017714330657529222}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.024905925069722477, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0006850846534012076}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.03850478234485377, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0011024526272317378}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.027643924254134603, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0007121708145651539}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.11125836759667614, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.00142424299423556}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.17033205247937977, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0019231978134307691}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.12276816133742628, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0012192289120582331}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.14179043128628907, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0018541893135933546}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.21137913675901987, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0023233022426073892}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.15558334623949294, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0016443580462993418}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 1.159384502447796, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.057628180591426645}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-repetitions/4b284b1b9oscar/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9oscar/evaluation/generation/agg.4b284b1b9oscar_GEM-wiki_lingua_en_tldr_en_1.json b/4b284b1b9oscar/evaluation/generation/agg.4b284b1b9oscar_GEM-wiki_lingua_en_tldr_en_1.json new file mode 100644 index 0000000000000000000000000000000000000000..afebb0fa9a3b7a5ceb6c249ffb51a3705e987f18 --- /dev/null +++ b/4b284b1b9oscar/evaluation/generation/agg.4b284b1b9oscar_GEM-wiki_lingua_en_tldr_en_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.17371296302390632, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0021902383124749454}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.24147579886101558, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0024751615706129063}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.1816842303684298, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0017782880793874537}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.03192092546391988, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0009424962628309825}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.04410602388358206, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0011954069713593922}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.03265176701451356, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0007878736261592252}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.12465533551452404, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0015982129307706894}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.17675811341682113, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0019268394653393782}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.13015162278257636, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0012020872378512297}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.1631041776023868, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0020525153232724904}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.22761644537805767, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0023639550060386397}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.17077057715538618, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0016691467024742542}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 1.566708990629026, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.0581496436272751}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-repetitions/4b284b1b9oscar/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9oscar/evaluation/generation/agg.4b284b1b9oscar_GEM-wiki_lingua_en_tldr_en_2.json b/4b284b1b9oscar/evaluation/generation/agg.4b284b1b9oscar_GEM-wiki_lingua_en_tldr_en_2.json new file mode 100644 index 0000000000000000000000000000000000000000..b17cd5449d294c49ffea85e92065311d22b36297 --- /dev/null +++ b/4b284b1b9oscar/evaluation/generation/agg.4b284b1b9oscar_GEM-wiki_lingua_en_tldr_en_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.17743624737565108, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0021492258023722674}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.25150886158134367, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0024524846458276782}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.18745443354388727, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0017296949460870405}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.03283000534133716, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0009328095980555773}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.045825393377754105, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0012602521826330568}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.033509423859662844, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0007929018957245757}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.12645353945710797, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0015870180893584427}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.18352284038906627, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0019514738060420578}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.1336204206295648, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0011901208386536995}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.16653674072514268, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.002024987535804069}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.23696286031880665, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002325990094088013}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.17608197313625737, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0016179873786064413}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 1.5566151429887363, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.07263045479067322}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-repetitions/4b284b1b9oscar/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9oscar/evaluation/generation/agg.4b284b1b9oscar_GEM-wiki_lingua_en_tldr_en_3.json b/4b284b1b9oscar/evaluation/generation/agg.4b284b1b9oscar_GEM-wiki_lingua_en_tldr_en_3.json new file mode 100644 index 0000000000000000000000000000000000000000..ad722316dafcf99377de7bd5e9ac9a8f1db7d8ff --- /dev/null +++ b/4b284b1b9oscar/evaluation/generation/agg.4b284b1b9oscar_GEM-wiki_lingua_en_tldr_en_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.14740810337408072, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.002271679945302172}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.20836892569223942, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0028639121415319447}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.15441643686495948, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0020001231144296736}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.026151374582378446, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0007896206739810243}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.037574793035193066, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0011612525965493635}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.02732982658717203, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0007317865399481251}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.10492025586641264, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0015968039001781839}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.15175102080784733, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0021792866520934837}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.10993608037589384, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0013690145372151107}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.13823688941444, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.002132419884185906}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.1956605692982594, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002692622620180876}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.14475462836497524, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0018689106719346205}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 1.5090266791250284, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.06924033448041976}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-repetitions/4b284b1b9oscar/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9oscar/evaluation/generation/agg.4b284b1b9oscar_GEM-wiki_lingua_en_tldr_en_4.json b/4b284b1b9oscar/evaluation/generation/agg.4b284b1b9oscar_GEM-wiki_lingua_en_tldr_en_4.json new file mode 100644 index 0000000000000000000000000000000000000000..59ef1e3274751fdcbe567046b361265d12808599 --- /dev/null +++ b/4b284b1b9oscar/evaluation/generation/agg.4b284b1b9oscar_GEM-wiki_lingua_en_tldr_en_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.049482797501199056, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0019059242917520388}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.07028822776695906, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002492820928227135}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.050539802692113486, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0017469478379052526}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.009307183820869624, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0005915386117685121}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.012698668080633723, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0007466714930192209}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.009189516501593525, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0005049910178490766}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.03621618955918932, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.00140538497956548}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.0526171116259514, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0018954837026351507}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.03691068397379973, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0012531679750741017}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.046090930054903605, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0017742451276749082}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.0656234761466232, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002326065080347693}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.0471157693901415, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0016276260750980145}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 0.22270796928381564, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.029433615868403155}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-repetitions/4b284b1b9oscar/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9oscar/evaluation/generation/agg.4b284b1b9oscar_GEM-wiki_lingua_en_tldr_en_5.json b/4b284b1b9oscar/evaluation/generation/agg.4b284b1b9oscar_GEM-wiki_lingua_en_tldr_en_5.json new file mode 100644 index 0000000000000000000000000000000000000000..f18e56536890f9b1a5622ba7c5a30b5b3fde196b --- /dev/null +++ b/4b284b1b9oscar/evaluation/generation/agg.4b284b1b9oscar_GEM-wiki_lingua_en_tldr_en_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.007478271052435213, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0008063007869225007}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.010338951290674275, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0010687996383989403}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.007351567651326997, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0007412176546731157}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.0013879834061599138, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0002237907618586408}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.002245934397481068, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.00039931884660781176}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.0014450651061614851, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0002191123197517165}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.005604377982811, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0006037717129781307}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.007942619745679938, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0008436730401849616}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.005480459085572166, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0005436419168699393}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.007131566619622942, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0007759264592303796}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.009791040555433658, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0010166014822588294}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.006967006053774628, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0007050533365556994}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 3.997473456123696e-08, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 1.002855650120767e-07}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-repetitions/4b284b1b9oscar/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9oscar/evaluation/generation/agg.4b284b1b9oscar_e2e_nlg_cleaned_generate_text_restaurant_0.json b/4b284b1b9oscar/evaluation/generation/agg.4b284b1b9oscar_e2e_nlg_cleaned_generate_text_restaurant_0.json new file mode 100644 index 0000000000000000000000000000000000000000..721c45ab71b55be3a66af32e03224b8a6a5f8c3e --- /dev/null +++ b/4b284b1b9oscar/evaluation/generation/agg.4b284b1b9oscar_e2e_nlg_cleaned_generate_text_restaurant_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 1.309497335599097, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.023324215467998514}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.11928395058889167, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0026720430430010717}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.16222047702577053, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002573881001494484}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.12101569116712643, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0018859465533766812}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.01996887174584161, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0008462437123245745}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.02965977606050867, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.001033586571455221}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.02190886095908555, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0007251164901007362}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.0972026278015815, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0024157240054608615}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.1287653818656058, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002033304125683539}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.09561805145503208, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0014452773316927124}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.1075291758702482, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0025162153224772906}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.14428075183193284, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002300879817943218}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.10772552310984851, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0016823465430055036}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-repetitions/4b284b1b9oscar/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9oscar/evaluation/generation/agg.4b284b1b9oscar_e2e_nlg_cleaned_generate_text_restaurant_1.json b/4b284b1b9oscar/evaluation/generation/agg.4b284b1b9oscar_e2e_nlg_cleaned_generate_text_restaurant_1.json new file mode 100644 index 0000000000000000000000000000000000000000..8f4f1f884d34e051cecc49513f8003cdd01fb447 --- /dev/null +++ b/4b284b1b9oscar/evaluation/generation/agg.4b284b1b9oscar_e2e_nlg_cleaned_generate_text_restaurant_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 7.230957749576389, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.0536425469915919}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.34380888996516695, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0030845076484356158}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.447391658162999, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002727984781486933}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.3592817925524962, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0021198922639512987}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.14545103598427403, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0019947160057053256}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.18921875166954605, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0020477910004319416}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.15054262500569862, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0015981728794968756}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.2533789645650362, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.002514469484712738}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.33025523426001224, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002291380183574316}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.2638992015247686, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0017193130894710778}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.2918162013801523, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0027922449703006685}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.3811978300988754, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0026251491058964013}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.3053449527328775, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002014422999339484}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-repetitions/4b284b1b9oscar/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9oscar/evaluation/generation/agg.4b284b1b9oscar_e2e_nlg_cleaned_generate_text_restaurant_2.json b/4b284b1b9oscar/evaluation/generation/agg.4b284b1b9oscar_e2e_nlg_cleaned_generate_text_restaurant_2.json new file mode 100644 index 0000000000000000000000000000000000000000..95a62ab71481d1d3beb09f6c0883466facec4368 --- /dev/null +++ b/4b284b1b9oscar/evaluation/generation/agg.4b284b1b9oscar_e2e_nlg_cleaned_generate_text_restaurant_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 11.80649360056355, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.1998199512362247}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.4618975292968109, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0033374021778200306}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.44185113042812146, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0027208355753659172}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.4233941396922909, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002240259708210042}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.21720316360476427, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0023932535396076963}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.20548913402282043, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0020643048503938386}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.19638166157139877, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0018136805158363019}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.345686135545352, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0028355066597269933}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.33044345883576104, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0023468520325341962}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.3159660620207397, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0019464502769911136}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.3920117254184558, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0030921641172849523}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.3756316032841477, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002600519205461284}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.35940536059201766, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0021791205035671516}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-repetitions/4b284b1b9oscar/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9oscar/evaluation/generation/agg.4b284b1b9oscar_e2e_nlg_cleaned_generate_text_restaurant_3.json b/4b284b1b9oscar/evaluation/generation/agg.4b284b1b9oscar_e2e_nlg_cleaned_generate_text_restaurant_3.json new file mode 100644 index 0000000000000000000000000000000000000000..f46d7c8de7c9d64db49858855335ce2ecb8d8264 --- /dev/null +++ b/4b284b1b9oscar/evaluation/generation/agg.4b284b1b9oscar_e2e_nlg_cleaned_generate_text_restaurant_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 12.91307719639215, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.1274857032754034}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.4709595396963552, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.003227057457923827}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.44897994314565826, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0026763988425963594}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.43472700621860616, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0021930927799969995}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.2252611249009733, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0023859573577785687}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.21265122060479416, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002077181955257037}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.2054392972212338, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0018449396852071784}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.35320392511807835, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.002743833223699648}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.33685020068084837, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002328588288588858}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.32543991881376977, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0019275494986348497}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.4032258158403475, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0030346167857717155}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.3847176304718895, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0025700421376888207}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.37211755259775925, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0021593105116151728}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-repetitions/4b284b1b9oscar/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9oscar/evaluation/generation/agg.4b284b1b9oscar_e2e_nlg_cleaned_generate_text_restaurant_4.json b/4b284b1b9oscar/evaluation/generation/agg.4b284b1b9oscar_e2e_nlg_cleaned_generate_text_restaurant_4.json new file mode 100644 index 0000000000000000000000000000000000000000..6028b43a272419e9e830d2727fde526b5d323dba --- /dev/null +++ b/4b284b1b9oscar/evaluation/generation/agg.4b284b1b9oscar_e2e_nlg_cleaned_generate_text_restaurant_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 12.895073995415705, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.15213341614493073}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.4650093328987851, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0031030240695590562}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.453603046375726, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0026544370156289954}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.4358889598609801, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002183214874104859}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.21937912264430276, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.002277471884890991}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.21394671208363505, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0021088970425982767}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.2044223942588151, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0018593650607392539}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.34738539994213957, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0026340554345153535}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.33972816863194827, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002342079191640274}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.3254926044349284, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0019460417013969558}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.39726620076907726, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0029189292625600117}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.3877392144856795, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0025612577080022566}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.37230138483200753, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002156573551629483}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-repetitions/4b284b1b9oscar/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9oscar/evaluation/generation/agg.4b284b1b9oscar_e2e_nlg_cleaned_generate_text_restaurant_5.json b/4b284b1b9oscar/evaluation/generation/agg.4b284b1b9oscar_e2e_nlg_cleaned_generate_text_restaurant_5.json new file mode 100644 index 0000000000000000000000000000000000000000..239ac09de058a04d9f81148d064b2e96895fb836 --- /dev/null +++ b/4b284b1b9oscar/evaluation/generation/agg.4b284b1b9oscar_e2e_nlg_cleaned_generate_text_restaurant_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 12.984249703645997, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.14605546972985659}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.4596711523135132, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0030229942436052165}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.4626551599063747, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0026402368817322257}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.4394110300981441, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002155708933961789}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.2193015904368128, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0022187644166033974}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.22067796088896902, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002098400156703052}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.20837071123028594, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0018180763618672092}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.3420249015987018, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0025525295785147847}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.3451786358998491, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0023314269399147035}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.3268336987119632, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.001906797734845931}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.39378396094073, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.002858394052035071}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.3964808392544174, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0025604225420971832}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.3762959528921545, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0021396018313958806}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-repetitions/4b284b1b9oscar/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9oscar/evaluation/generation/agg.4b284b1b9oscar_gem_xsum_article_DOC_summary_0.json b/4b284b1b9oscar/evaluation/generation/agg.4b284b1b9oscar_gem_xsum_article_DOC_summary_0.json new file mode 100644 index 0000000000000000000000000000000000000000..e812ce7e0eb5e85ba3d7d96e788301f6667dbe2d --- /dev/null +++ b/4b284b1b9oscar/evaluation/generation/agg.4b284b1b9oscar_gem_xsum_article_DOC_summary_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.12832828142164515, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0017794562183186251}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.28847248029120043, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.003889108647255819}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.17444657578502828, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0022844654329194137}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.021115950384362318, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.000843051310287779}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.04925763881619255, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0020461456356515254}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.029039326805435032, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0011554949380146165}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.09350128038856384, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0012793590377888806}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.21105922988342335, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0028651027111890855}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.12720258223547712, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.001648248487654858}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.10200423853654914, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0013916696816987264}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.2313753113336317, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0032368664660586965}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.1390205462262644, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.001823510668675631}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 0.997655025281657, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.08049545372158354}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-repetitions/4b284b1b9oscar/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9oscar/evaluation/generation/agg.4b284b1b9oscar_gem_xsum_article_DOC_summary_1.json b/4b284b1b9oscar/evaluation/generation/agg.4b284b1b9oscar_gem_xsum_article_DOC_summary_1.json new file mode 100644 index 0000000000000000000000000000000000000000..04d137955b70e2878f66eef839c18a6f48a7375d --- /dev/null +++ b/4b284b1b9oscar/evaluation/generation/agg.4b284b1b9oscar_gem_xsum_article_DOC_summary_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.1309454764999026, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.001827765049519732}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.29700562382894197, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.003795399616335189}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.17768393062360832, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0022349506141921644}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.02041569980816869, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0008450735436051835}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.04822240605480935, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0019777747068750423}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.027990512381062316, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.001130566656515218}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.09504020604087868, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0013599947712725539}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.2162072871160676, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002829869659329609}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.1288738749109626, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.001625277139920424}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.10335621277254586, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.001462699625038698}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.23614329439124435, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0031713690732049172}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.14046128881678455, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0017990331974292878}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 0.9675071405690926, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.09958935593288926}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-repetitions/4b284b1b9oscar/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9oscar/evaluation/generation/agg.4b284b1b9oscar_gem_xsum_article_DOC_summary_2.json b/4b284b1b9oscar/evaluation/generation/agg.4b284b1b9oscar_gem_xsum_article_DOC_summary_2.json new file mode 100644 index 0000000000000000000000000000000000000000..040783002e87083e5636cc099f6e84c819a3dde3 --- /dev/null +++ b/4b284b1b9oscar/evaluation/generation/agg.4b284b1b9oscar_gem_xsum_article_DOC_summary_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.13326231738564168, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0018541538731038265}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.30653846845415633, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.003718784510021167}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.1815853317619735, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0022198474125888993}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.022289828836057894, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0008725918092828604}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.05259029448210306, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0021143622321714616}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.030561262010519005, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0011776564417043847}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.09606073585619543, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.001320735780400149}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.2222896298147904, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0027767376278209476}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.13099347768064226, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0015774167795458336}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.105504826402108, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0014517045288292944}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.24526632623966604, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0031905602481124952}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.14421468208543237, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.001795033812855214}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 1.0366131861525387, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.08607955425699379}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-repetitions/4b284b1b9oscar/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9oscar/evaluation/generation/agg.4b284b1b9oscar_gem_xsum_article_DOC_summary_3.json b/4b284b1b9oscar/evaluation/generation/agg.4b284b1b9oscar_gem_xsum_article_DOC_summary_3.json new file mode 100644 index 0000000000000000000000000000000000000000..86635d42e13b9cdaf0e47180feef163b73dc6d0c --- /dev/null +++ b/4b284b1b9oscar/evaluation/generation/agg.4b284b1b9oscar_gem_xsum_article_DOC_summary_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.12940832070901992, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0019943586762260035}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.2884068479099661, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004068894100326392}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.17299896718015717, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0024005443718459487}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.020122251087519527, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0008493738964290155}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.0463800028049885, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0019308344795767856}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.02723037446755515, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0011161293152371049}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.09345653613534448, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.00145180399823862}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.2091744165096173, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0029753866994255977}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.1247856962494059, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0016915785603912935}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.10212955921043831, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0016013787895265638}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.2290005827276144, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0033599851151365936}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.13664310066002217, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0019261086832577496}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 1.0158973292814215, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.11093743610635416}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-repetitions/4b284b1b9oscar/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9oscar/evaluation/generation/agg.4b284b1b9oscar_gem_xsum_article_DOC_summary_4.json b/4b284b1b9oscar/evaluation/generation/agg.4b284b1b9oscar_gem_xsum_article_DOC_summary_4.json new file mode 100644 index 0000000000000000000000000000000000000000..64235c466fafb75ac2c8e3d63326e184fb75c2d1 --- /dev/null +++ b/4b284b1b9oscar/evaluation/generation/agg.4b284b1b9oscar_gem_xsum_article_DOC_summary_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.0373879533361559, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0021810464397006403}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.07150811812236044, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004101431121761528}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.04539068876881627, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002529463308822854}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.005550765385729703, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0005963003468727854}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.011310401420282012, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0010721548649813347}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.007032145297330701, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0006749391536461736}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.0280016015013484, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0017038515915968166}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.05214073374869573, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0029695500586895698}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.03322213103634567, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0018345484180096144}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.03019679894521189, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0018216600106999053}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.05685075214207904, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0032708994661166087}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.03607224322510311, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0020071211692870355}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 0.5019536886003719, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.1343611351129069}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-repetitions/4b284b1b9oscar/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9oscar/evaluation/generation/agg.4b284b1b9oscar_gem_xsum_article_DOC_summary_5.json b/4b284b1b9oscar/evaluation/generation/agg.4b284b1b9oscar_gem_xsum_article_DOC_summary_5.json new file mode 100644 index 0000000000000000000000000000000000000000..c2bfff5471ade2765aedabb75cd5995d34b737c0 --- /dev/null +++ b/4b284b1b9oscar/evaluation/generation/agg.4b284b1b9oscar_gem_xsum_article_DOC_summary_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.0023010225042523016, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0007056279408099138}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.0017639670878076587, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0005179713630676667}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.001950949795538486, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0005800061914629863}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.0, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.0, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.0, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.001755708684944675, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.000517656162281774}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.001338960546022285, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.00037496082953111386}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.0014822281925852424, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0004217162689453353}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.001800847260371234, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0005272819939622312}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.0013894095420872634, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.00039142547685255293}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.001529874466646611, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.00043483560412767216}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 1.0120083486806341e-43, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 2.299599307531863e-38}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-repetitions/4b284b1b9oscar/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9oscar/evaluation/generation/examples.4b284b1b9oscar_GEM-web_nlg_en_PALM_prompt_0.jsonl b/4b284b1b9oscar/evaluation/generation/examples.4b284b1b9oscar_GEM-web_nlg_en_PALM_prompt_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..68e4e993f5876d05d2db8e6bdb463adec4fc5aa0 --- /dev/null +++ b/4b284b1b9oscar/evaluation/generation/examples.4b284b1b9oscar_GEM-web_nlg_en_PALM_prompt_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f5a576c0eb7f779bbaf8f1b2aeb35fc938dd8e591045d585f0d3c6789608da6 +size 4119438 diff --git a/4b284b1b9oscar/evaluation/generation/examples.4b284b1b9oscar_GEM-web_nlg_en_PALM_prompt_1.jsonl b/4b284b1b9oscar/evaluation/generation/examples.4b284b1b9oscar_GEM-web_nlg_en_PALM_prompt_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..4adec227d62af887ea4796c032890951e3e3a68b --- /dev/null +++ b/4b284b1b9oscar/evaluation/generation/examples.4b284b1b9oscar_GEM-web_nlg_en_PALM_prompt_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b0f9faa93c49fbd99e9fcd3f01e27943b5fa221aa79a75afaa970aae2fb078af +size 4869804 diff --git a/4b284b1b9oscar/evaluation/generation/examples.4b284b1b9oscar_GEM-web_nlg_en_PALM_prompt_2.jsonl b/4b284b1b9oscar/evaluation/generation/examples.4b284b1b9oscar_GEM-web_nlg_en_PALM_prompt_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..fbe57c0b47295195f2f9571eb570e162199c585c --- /dev/null +++ b/4b284b1b9oscar/evaluation/generation/examples.4b284b1b9oscar_GEM-web_nlg_en_PALM_prompt_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b53150ea7cdbe0fa32933869dd6018c08df9c5d88090f65039c4143cef5e595 +size 5720560 diff --git a/4b284b1b9oscar/evaluation/generation/examples.4b284b1b9oscar_GEM-web_nlg_en_PALM_prompt_3.jsonl b/4b284b1b9oscar/evaluation/generation/examples.4b284b1b9oscar_GEM-web_nlg_en_PALM_prompt_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..827e5900b776b668a22081bf9cfb7edb0f399c47 --- /dev/null +++ b/4b284b1b9oscar/evaluation/generation/examples.4b284b1b9oscar_GEM-web_nlg_en_PALM_prompt_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d5dc0664fff2c715500d222d1c1d503502914828586c81dc68b14304b3e62292 +size 6593874 diff --git a/4b284b1b9oscar/evaluation/generation/examples.4b284b1b9oscar_GEM-web_nlg_en_PALM_prompt_4.jsonl b/4b284b1b9oscar/evaluation/generation/examples.4b284b1b9oscar_GEM-web_nlg_en_PALM_prompt_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..daf958dd47cd86e1a4aa4f89d0b457899267be9c --- /dev/null +++ b/4b284b1b9oscar/evaluation/generation/examples.4b284b1b9oscar_GEM-web_nlg_en_PALM_prompt_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f83f2aa603023dea02a746a126fe20e8b4c648a7192dcf32f2ae771eaa581589 +size 7518117 diff --git a/4b284b1b9oscar/evaluation/generation/examples.4b284b1b9oscar_GEM-web_nlg_en_PALM_prompt_5.jsonl b/4b284b1b9oscar/evaluation/generation/examples.4b284b1b9oscar_GEM-web_nlg_en_PALM_prompt_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..618e676bc3d396258dc2a48e2b2152a9b0da47b3 --- /dev/null +++ b/4b284b1b9oscar/evaluation/generation/examples.4b284b1b9oscar_GEM-web_nlg_en_PALM_prompt_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8145217d9adf90f861709a29aa5941ab3d72e803085cd4717d2ac03076d37f90 +size 8417608 diff --git a/4b284b1b9oscar/evaluation/generation/examples.4b284b1b9oscar_GEM-wiki_lingua_en_tldr_en_0.jsonl b/4b284b1b9oscar/evaluation/generation/examples.4b284b1b9oscar_GEM-wiki_lingua_en_tldr_en_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..5030ce2ccf37fa82ad95ebaa4db8ce5d5e6bf0ca --- /dev/null +++ b/4b284b1b9oscar/evaluation/generation/examples.4b284b1b9oscar_GEM-wiki_lingua_en_tldr_en_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ac9fb81930624774f0af9804638ccef2b345f5ba12991a0d065ac5d3a371be0 +size 7644487 diff --git a/4b284b1b9oscar/evaluation/generation/examples.4b284b1b9oscar_GEM-wiki_lingua_en_tldr_en_1.jsonl b/4b284b1b9oscar/evaluation/generation/examples.4b284b1b9oscar_GEM-wiki_lingua_en_tldr_en_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..a07ababfd188b9da6c91807bd436e91bb3e34a9a --- /dev/null +++ b/4b284b1b9oscar/evaluation/generation/examples.4b284b1b9oscar_GEM-wiki_lingua_en_tldr_en_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9033e20d370ea2f889df512abc3071d4e0535af11b12e75fa4f9785512c5f18b +size 13236909 diff --git a/4b284b1b9oscar/evaluation/generation/examples.4b284b1b9oscar_GEM-wiki_lingua_en_tldr_en_2.jsonl b/4b284b1b9oscar/evaluation/generation/examples.4b284b1b9oscar_GEM-wiki_lingua_en_tldr_en_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..b13fd3ad705b8e0d1b548f4cb11c0c21771d5bb9 --- /dev/null +++ b/4b284b1b9oscar/evaluation/generation/examples.4b284b1b9oscar_GEM-wiki_lingua_en_tldr_en_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34ae1f769ad9bc3da46ae2b5a72f444bbd845674078f3cdc39c035318cdf8bf3 +size 18852132 diff --git a/4b284b1b9oscar/evaluation/generation/examples.4b284b1b9oscar_GEM-wiki_lingua_en_tldr_en_3.jsonl b/4b284b1b9oscar/evaluation/generation/examples.4b284b1b9oscar_GEM-wiki_lingua_en_tldr_en_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..912dd9b44f6bd344a8cf6d85bf77aa477810adae --- /dev/null +++ b/4b284b1b9oscar/evaluation/generation/examples.4b284b1b9oscar_GEM-wiki_lingua_en_tldr_en_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9fda4b35b5f493910116e0f464829940832aeadcc9f3f470db98f4148d06dc1e +size 24291119 diff --git a/4b284b1b9oscar/evaluation/generation/examples.4b284b1b9oscar_GEM-wiki_lingua_en_tldr_en_4.jsonl b/4b284b1b9oscar/evaluation/generation/examples.4b284b1b9oscar_GEM-wiki_lingua_en_tldr_en_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..4cf6eb92b4726cc2c9009b96b526121f31250bfc --- /dev/null +++ b/4b284b1b9oscar/evaluation/generation/examples.4b284b1b9oscar_GEM-wiki_lingua_en_tldr_en_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6bb9d7377d490990ba2c508cc2da32c9f4ce4c79f21fdfb007e6663b8afbe089 +size 29461686 diff --git a/4b284b1b9oscar/evaluation/generation/examples.4b284b1b9oscar_GEM-wiki_lingua_en_tldr_en_5.jsonl b/4b284b1b9oscar/evaluation/generation/examples.4b284b1b9oscar_GEM-wiki_lingua_en_tldr_en_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..c663c7674eccdc5eacbf7de13fa3e825cd6d3397 --- /dev/null +++ b/4b284b1b9oscar/evaluation/generation/examples.4b284b1b9oscar_GEM-wiki_lingua_en_tldr_en_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8a6c55761d1858427857cc3d614c7c9a26fef6a7ef46f0b647de89584b8b865 +size 34798037 diff --git a/4b284b1b9oscar/evaluation/generation/examples.4b284b1b9oscar_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl b/4b284b1b9oscar/evaluation/generation/examples.4b284b1b9oscar_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..51d56b065e34ec792246a68bf3a32c233ad33a44 --- /dev/null +++ b/4b284b1b9oscar/evaluation/generation/examples.4b284b1b9oscar_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:17d386d13c1b250a218dc66d6575a84a59a2c6daafbff5cb828e5eff7d321ef9 +size 4141362 diff --git a/4b284b1b9oscar/evaluation/generation/examples.4b284b1b9oscar_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl b/4b284b1b9oscar/evaluation/generation/examples.4b284b1b9oscar_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..1662e6122c94cfbc04ceb5f683a27627f9abe2e5 --- /dev/null +++ b/4b284b1b9oscar/evaluation/generation/examples.4b284b1b9oscar_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5177bf7e02c86e3a44223fc796a82dd12a27eb473569b21f703f47ccb685a49f +size 5311652 diff --git a/4b284b1b9oscar/evaluation/generation/examples.4b284b1b9oscar_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl b/4b284b1b9oscar/evaluation/generation/examples.4b284b1b9oscar_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..f046954b2403e200311c2c9fb0b6c4f852a4cf31 --- /dev/null +++ b/4b284b1b9oscar/evaluation/generation/examples.4b284b1b9oscar_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e457ea2b60034840e35a86827fe907b4a53c2bcef884e6843f3392845417eba5 +size 6200216 diff --git a/4b284b1b9oscar/evaluation/generation/examples.4b284b1b9oscar_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl b/4b284b1b9oscar/evaluation/generation/examples.4b284b1b9oscar_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..45a928374772f9059ac6fc1ea6fbe969fd53bb52 --- /dev/null +++ b/4b284b1b9oscar/evaluation/generation/examples.4b284b1b9oscar_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d22283bf5fc26ef999fca0a7fdbe3fcf67b395bedb19d85d5d26bfd9a006350d +size 7267041 diff --git a/4b284b1b9oscar/evaluation/generation/examples.4b284b1b9oscar_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl b/4b284b1b9oscar/evaluation/generation/examples.4b284b1b9oscar_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..1f9e761cba81a2534cdd0b1106e962f3f353d7ba --- /dev/null +++ b/4b284b1b9oscar/evaluation/generation/examples.4b284b1b9oscar_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b698c65320e3e8e13db873b4e9b152735b01967a7d1317e0ec6977b68e1da12f +size 8350544 diff --git a/4b284b1b9oscar/evaluation/generation/examples.4b284b1b9oscar_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl b/4b284b1b9oscar/evaluation/generation/examples.4b284b1b9oscar_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..6fc8edc3edaaaf14cf70b4bbe20545388e45b8c4 --- /dev/null +++ b/4b284b1b9oscar/evaluation/generation/examples.4b284b1b9oscar_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd5b02a169d5a5fe095ce848d40d893a2e852c77fb93cb5604d85c80a194b471 +size 9447281 diff --git a/4b284b1b9oscar/evaluation/generation/examples.4b284b1b9oscar_gem_xsum_article_DOC_summary_0.jsonl b/4b284b1b9oscar/evaluation/generation/examples.4b284b1b9oscar_gem_xsum_article_DOC_summary_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..9b4ec32511091495f6ee6bde7213e6f4d108cfbb --- /dev/null +++ b/4b284b1b9oscar/evaluation/generation/examples.4b284b1b9oscar_gem_xsum_article_DOC_summary_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e76a0766450e3ea899db92a81543d2b9a635a99840d7790f97f292c2520d38a3 +size 2817367 diff --git a/4b284b1b9oscar/evaluation/generation/examples.4b284b1b9oscar_gem_xsum_article_DOC_summary_1.jsonl b/4b284b1b9oscar/evaluation/generation/examples.4b284b1b9oscar_gem_xsum_article_DOC_summary_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..0ad8d416b79fa9ec73739146ebb8de273717fbd6 --- /dev/null +++ b/4b284b1b9oscar/evaluation/generation/examples.4b284b1b9oscar_gem_xsum_article_DOC_summary_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5abef03f2fef8a8e4a1a97bf6d1d5c0684fd7638e11ff0bcbb913ab663f457cb +size 5088717 diff --git a/4b284b1b9oscar/evaluation/generation/examples.4b284b1b9oscar_gem_xsum_article_DOC_summary_2.jsonl b/4b284b1b9oscar/evaluation/generation/examples.4b284b1b9oscar_gem_xsum_article_DOC_summary_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..55afbb1645376953d96c62c3f225be85595a4303 --- /dev/null +++ b/4b284b1b9oscar/evaluation/generation/examples.4b284b1b9oscar_gem_xsum_article_DOC_summary_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e67cfdfb89b82e881a06b18b7abb240d993451692c114997d553bd114d1292c +size 7366819 diff --git a/4b284b1b9oscar/evaluation/generation/examples.4b284b1b9oscar_gem_xsum_article_DOC_summary_3.jsonl b/4b284b1b9oscar/evaluation/generation/examples.4b284b1b9oscar_gem_xsum_article_DOC_summary_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..3da8b8b8649c0c60caf4be8f0cdcaf63f51d4cd3 --- /dev/null +++ b/4b284b1b9oscar/evaluation/generation/examples.4b284b1b9oscar_gem_xsum_article_DOC_summary_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e88d3cf49e602e641a8a0fcc2a93b4a22fbb834100bfe566647403f3b38e8b6 +size 9635577 diff --git a/4b284b1b9oscar/evaluation/generation/examples.4b284b1b9oscar_gem_xsum_article_DOC_summary_4.jsonl b/4b284b1b9oscar/evaluation/generation/examples.4b284b1b9oscar_gem_xsum_article_DOC_summary_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..1b734b39594e142967dd31431984a27ace64bd62 --- /dev/null +++ b/4b284b1b9oscar/evaluation/generation/examples.4b284b1b9oscar_gem_xsum_article_DOC_summary_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:47d9bde9b796c8016a005232d87759fbe21d1ac2c500efde0c2d4e6424b56df3 +size 11671902 diff --git a/4b284b1b9oscar/evaluation/generation/examples.4b284b1b9oscar_gem_xsum_article_DOC_summary_5.jsonl b/4b284b1b9oscar/evaluation/generation/examples.4b284b1b9oscar_gem_xsum_article_DOC_summary_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..0e949ed4d2902641ef29bd785ae2d222b9764558 --- /dev/null +++ b/4b284b1b9oscar/evaluation/generation/examples.4b284b1b9oscar_gem_xsum_article_DOC_summary_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b97ce08d35fa54040403dfce45df683beb490e6679164047411b3791ab488d2 +size 13897356 diff --git a/4b284b1b9oscar/evaluation/generation/merged.csv b/4b284b1b9oscar/evaluation/generation/merged.csv new file mode 100644 index 0000000000000000000000000000000000000000..aec441831fd8981b84cad166b35624c6951e481b --- /dev/null +++ b/4b284b1b9oscar/evaluation/generation/merged.csv @@ -0,0 +1,53 @@ +dataset,fewshots,prompt,metric,value +e2e_nlg_cleaned,0,generate_text_restaurant,rouge2_fmeasure,0.02190886095908555 +e2e_nlg_cleaned,0,median,rouge2_fmeasure,0.02190886095908555 +e2e_nlg_cleaned,1,generate_text_restaurant,rouge2_fmeasure,0.15054262500569862 +e2e_nlg_cleaned,1,median,rouge2_fmeasure,0.15054262500569862 +e2e_nlg_cleaned,2,generate_text_restaurant,rouge2_fmeasure,0.19638166157139877 +e2e_nlg_cleaned,2,median,rouge2_fmeasure,0.19638166157139877 +e2e_nlg_cleaned,3,generate_text_restaurant,rouge2_fmeasure,0.2054392972212338 +e2e_nlg_cleaned,3,median,rouge2_fmeasure,0.2054392972212338 +e2e_nlg_cleaned,4,generate_text_restaurant,rouge2_fmeasure,0.2044223942588151 +e2e_nlg_cleaned,4,median,rouge2_fmeasure,0.2044223942588151 +e2e_nlg_cleaned,5,generate_text_restaurant,rouge2_fmeasure,0.20837071123028594 +e2e_nlg_cleaned,5,median,rouge2_fmeasure,0.20837071123028594 +e2e_nlg_cleaned,5,average,multiple,0.1645109250410863 +gem_xsum,0,article_DOC_summary,rouge2_fmeasure,0.029039326805435032 +gem_xsum,0,median,rouge2_fmeasure,0.029039326805435032 +gem_xsum,1,article_DOC_summary,rouge2_fmeasure,0.027990512381062316 +gem_xsum,1,median,rouge2_fmeasure,0.027990512381062316 +gem_xsum,2,article_DOC_summary,rouge2_fmeasure,0.030561262010519005 +gem_xsum,2,median,rouge2_fmeasure,0.030561262010519005 +gem_xsum,3,article_DOC_summary,rouge2_fmeasure,0.02723037446755515 +gem_xsum,3,median,rouge2_fmeasure,0.02723037446755515 +gem_xsum,4,article_DOC_summary,rouge2_fmeasure,0.007032145297330701 +gem_xsum,4,median,rouge2_fmeasure,0.007032145297330701 +gem_xsum,5,article_DOC_summary,rouge2_fmeasure,0.0 +gem_xsum,5,median,rouge2_fmeasure,0.0 +gem_xsum,5,average,multiple,0.0203089368269837 +web_nlg_en,0,PALM_prompt,rouge2_fmeasure,0.029457430490114032 +web_nlg_en,0,median,rouge2_fmeasure,0.029457430490114032 +web_nlg_en,1,PALM_prompt,rouge2_fmeasure,0.03553245669340435 +web_nlg_en,1,median,rouge2_fmeasure,0.03553245669340435 +web_nlg_en,2,PALM_prompt,rouge2_fmeasure,0.03910067067467762 +web_nlg_en,2,median,rouge2_fmeasure,0.03910067067467762 +web_nlg_en,3,PALM_prompt,rouge2_fmeasure,0.04302598363295129 +web_nlg_en,3,median,rouge2_fmeasure,0.04302598363295129 +web_nlg_en,4,PALM_prompt,rouge2_fmeasure,0.042594714406787165 +web_nlg_en,4,median,rouge2_fmeasure,0.042594714406787165 +web_nlg_en,5,PALM_prompt,rouge2_fmeasure,0.04130600915194189 +web_nlg_en,5,median,rouge2_fmeasure,0.04130600915194189 +web_nlg_en,5,average,multiple,0.03850287750831272 +wiki_lingua_en,0,tldr_en,rouge2_fmeasure,0.027643924254134603 +wiki_lingua_en,0,median,rouge2_fmeasure,0.027643924254134603 +wiki_lingua_en,1,tldr_en,rouge2_fmeasure,0.03265176701451356 +wiki_lingua_en,1,median,rouge2_fmeasure,0.03265176701451356 +wiki_lingua_en,2,tldr_en,rouge2_fmeasure,0.033509423859662844 +wiki_lingua_en,2,median,rouge2_fmeasure,0.033509423859662844 +wiki_lingua_en,3,tldr_en,rouge2_fmeasure,0.02732982658717203 +wiki_lingua_en,3,median,rouge2_fmeasure,0.02732982658717203 +wiki_lingua_en,4,tldr_en,rouge2_fmeasure,0.009189516501593525 +wiki_lingua_en,4,median,rouge2_fmeasure,0.009189516501593525 +wiki_lingua_en,5,tldr_en,rouge2_fmeasure,0.0014450651061614851 +wiki_lingua_en,5,median,rouge2_fmeasure,0.0014450651061614851 +wiki_lingua_en,5,average,multiple,0.021961587220539674 diff --git a/4b284b1b9oscar/evaluation/generation/merged.json b/4b284b1b9oscar/evaluation/generation/merged.json new file mode 100644 index 0000000000000000000000000000000000000000..f0c8b2680821769fe2dafb7b61446ee2f5368530 --- /dev/null +++ b/4b284b1b9oscar/evaluation/generation/merged.json @@ -0,0 +1 @@ +{"GEM/web_nlg_en": {"0": {"PALM_prompt": {"bleu": 0.3035990566203564, "bleu_stderr": 0.025090566187709752, "rouge1_fmeasure": 0.08651516220636073, "rouge1_fmeasure_stderr": 0.0018421075247631034, "rouge1_precision": 0.071329758776339, "rouge1_precision_stderr": 0.00279942361165936, "rouge1_recall": 0.2777833537640477, "rouge1_recall_stderr": 0.005021363310584012, "rouge2_fmeasure": 0.029457430490114032, "rouge2_fmeasure_stderr": 0.0010438331217221088, "rouge2_precision": 0.02493593159722908, "rouge2_precision_stderr": 0.0015907952635559632, "rouge2_recall": 0.09479553172438937, "rouge2_recall_stderr": 0.0029506060980076265, "rougeL_fmeasure": 0.07406437697939146, "rougeL_fmeasure_stderr": 0.0015395345437139562, "rougeL_precision": 0.06175148366384243, "rougeL_precision_stderr": 0.002527555333736909, "rougeL_recall": 0.2437824603111534, "rougeL_recall_stderr": 0.004509160724470269, "rougeLsum_fmeasure": 0.07865092467105374, "rougeLsum_fmeasure_stderr": 0.0016703135405487922, "rougeLsum_precision": 0.06515539016564718, "rougeLsum_precision_stderr": 0.0025912111251545702, "rougeLsum_recall": 0.2540442770643496, "rougeLsum_recall_stderr": 0.00462671195388165}}, "1": {"PALM_prompt": {"bleu": 0.425747629657599, "bleu_stderr": 0.019098717536100474, "rouge1_fmeasure": 0.09915747457632551, "rouge1_fmeasure_stderr": 0.0020735345455021683, "rouge1_precision": 0.07869000641860335, "rouge1_precision_stderr": 0.002574141434973694, "rouge1_recall": 0.27911697917731965, "rouge1_recall_stderr": 0.005025828797632534, "rouge2_fmeasure": 0.03553245669340435, "rouge2_fmeasure_stderr": 0.0012297768666432714, "rouge2_precision": 0.028711039922457098, "rouge2_precision_stderr": 0.0015895748345510915, "rouge2_recall": 0.1016349747426781, "rouge2_recall_stderr": 0.003064263260383757, "rougeL_fmeasure": 0.08430815534591073, "rougeL_fmeasure_stderr": 0.001735358065989058, "rougeL_precision": 0.06784822137078164, "rougeL_precision_stderr": 0.0023584286957804, "rougeL_recall": 0.24104415879973046, "rougeL_recall_stderr": 0.004392721456408033, "rougeLsum_fmeasure": 0.09052335683054723, "rougeLsum_fmeasure_stderr": 0.00188465696521615, "rougeLsum_precision": 0.07247904169290792, "rougeLsum_precision_stderr": 0.002450321126322307, "rougeLsum_recall": 0.25603235118880574, "rougeLsum_recall_stderr": 0.004615086249365793}}, "2": {"PALM_prompt": {"bleu": 0.4497583704772655, "bleu_stderr": 0.020681936257570407, "rouge1_fmeasure": 0.10711351422120703, "rouge1_fmeasure_stderr": 0.0024517943039154802, "rouge1_precision": 0.08676474022374367, "rouge1_precision_stderr": 0.0030356563200589527, "rouge1_recall": 0.28565036099040625, "rouge1_recall_stderr": 0.005160364852348898, "rouge2_fmeasure": 0.03910067067467762, "rouge2_fmeasure_stderr": 0.0014210269756776363, "rouge2_precision": 0.03205343730461677, "rouge2_precision_stderr": 0.001723196140481487, "rouge2_recall": 0.10665226766319001, "rouge2_recall_stderr": 0.0031321051228955267, "rougeL_fmeasure": 0.08897314932870945, "rougeL_fmeasure_stderr": 0.002002929328501285, "rougeL_precision": 0.07292425907812133, "rougeL_precision_stderr": 0.002682288331233897, "rougeL_recall": 0.2418993456910343, "rougeL_recall_stderr": 0.004387413324828132, "rougeLsum_fmeasure": 0.09589616680302177, "rougeLsum_fmeasure_stderr": 0.0021426419270798853, "rougeLsum_precision": 0.07776458484873876, "rougeLsum_precision_stderr": 0.002744825042381609, "rougeLsum_recall": 0.25905556991925294, "rougeLsum_recall_stderr": 0.004682330002575584}}, "3": {"PALM_prompt": {"bleu": 0.5453566942766312, "bleu_stderr": 0.03174339868079995, "rouge1_fmeasure": 0.11381502730552777, "rouge1_fmeasure_stderr": 0.0025266791277412273, "rouge1_precision": 0.09141520582826082, "rouge1_precision_stderr": 0.0030271528036140147, "rouge1_recall": 0.2946460917400917, "rouge1_recall_stderr": 0.005150457597998139, "rouge2_fmeasure": 0.04302598363295129, "rouge2_fmeasure_stderr": 0.0015803110546547487, "rouge2_precision": 0.0349533732864018, "rouge2_precision_stderr": 0.0018089338825247128, "rouge2_recall": 0.1132672221907378, "rouge2_recall_stderr": 0.0032322633657986535, "rougeL_fmeasure": 0.09476653245926525, "rougeL_fmeasure_stderr": 0.002130119160105199, "rougeL_precision": 0.07724838020684321, "rougeL_precision_stderr": 0.0027324213899579644, "rougeL_recall": 0.24881404393817505, "rougeL_recall_stderr": 0.004406171113605123, "rougeLsum_fmeasure": 0.10301268965900799, "rougeLsum_fmeasure_stderr": 0.0022888513790911423, "rougeLsum_precision": 0.0833829754674534, "rougeLsum_precision_stderr": 0.0028479312887177617, "rougeLsum_recall": 0.26789842816421516, "rougeLsum_recall_stderr": 0.00469224168355405}}, "4": {"PALM_prompt": {"bleu": 0.552842738936437, "bleu_stderr": 0.031220316118742313, "rouge1_fmeasure": 0.1125896095390658, "rouge1_fmeasure_stderr": 0.0024441626752801536, "rouge1_precision": 0.0904044344997309, "rouge1_precision_stderr": 0.0028870247747819445, "rouge1_recall": 0.30097906504674915, "rouge1_recall_stderr": 0.005237112327131232, "rouge2_fmeasure": 0.042594714406787165, "rouge2_fmeasure_stderr": 0.0014574874865349483, "rouge2_precision": 0.03357915742500351, "rouge2_precision_stderr": 0.001563192087212674, "rouge2_recall": 0.1186975703608361, "rouge2_recall_stderr": 0.0033758949815214734, "rougeL_fmeasure": 0.09294924226115779, "rougeL_fmeasure_stderr": 0.00201851881067649, "rougeL_precision": 0.07544711584950896, "rougeL_precision_stderr": 0.0025299603142831984, "rougeL_recall": 0.2529660247399177, "rougeL_recall_stderr": 0.00445147947055177, "rougeLsum_fmeasure": 0.10127472230162189, "rougeLsum_fmeasure_stderr": 0.002166709168455675, "rougeLsum_precision": 0.08174948336092744, "rougeLsum_precision_stderr": 0.0026566402566456145, "rougeLsum_recall": 0.2733792203624409, "rougeLsum_recall_stderr": 0.0047675031230854}}, "5": {"PALM_prompt": {"bleu": 0.5160808451457419, "bleu_stderr": 0.028152585581808363, "rouge1_fmeasure": 0.11267246257206415, "rouge1_fmeasure_stderr": 0.0023161203363087435, "rouge1_precision": 0.08756298477917958, "rouge1_precision_stderr": 0.002702960483622272, "rouge1_recall": 0.30943226003927954, "rouge1_recall_stderr": 0.00537568452081882, "rouge2_fmeasure": 0.04130600915194189, "rouge2_fmeasure_stderr": 0.0014050088099057468, "rouge2_precision": 0.031279144513968335, "rouge2_precision_stderr": 0.0015413777797901, "rouge2_recall": 0.1215282455226915, "rouge2_recall_stderr": 0.003458287142794445, "rougeL_fmeasure": 0.09293487391814521, "rougeL_fmeasure_stderr": 0.0018937867038700312, "rougeL_precision": 0.0727149677685351, "rougeL_precision_stderr": 0.002357535066892359, "rougeL_recall": 0.25979581419981984, "rougeL_recall_stderr": 0.004554297207344822, "rougeLsum_fmeasure": 0.10164495184500182, "rougeLsum_fmeasure_stderr": 0.0020419190457151644, "rougeLsum_precision": 0.07890883384983154, "rougeLsum_precision_stderr": 0.002452737865418059, "rougeLsum_recall": 0.28252744959181614, "rougeLsum_recall_stderr": 0.004927414464655944}}}, "GEM/wiki_lingua_en": {"0": {"tldr_en": {"bleu": 1.159384502447796, "bleu_stderr": 0.057628180591426645, "rouge1_fmeasure": 0.16612440507868828, "rouge1_fmeasure_stderr": 0.0017714330657529222, "rouge1_precision": 0.15144825263093634, "rouge1_precision_stderr": 0.001983783278782952, "rouge1_recall": 0.22534109695497295, "rouge1_recall_stderr": 0.002481691416374552, "rouge2_fmeasure": 0.027643924254134603, "rouge2_fmeasure_stderr": 0.0007121708145651539, "rouge2_precision": 0.024905925069722477, "rouge2_precision_stderr": 0.0006850846534012076, "rouge2_recall": 0.03850478234485377, "rouge2_recall_stderr": 0.0011024526272317378, "rougeL_fmeasure": 0.12276816133742628, "rougeL_fmeasure_stderr": 0.0012192289120582331, "rougeL_precision": 0.11125836759667614, "rougeL_precision_stderr": 0.00142424299423556, "rougeL_recall": 0.17033205247937977, "rougeL_recall_stderr": 0.0019231978134307691, "rougeLsum_fmeasure": 0.15558334623949294, "rougeLsum_fmeasure_stderr": 0.0016443580462993418, "rougeLsum_precision": 0.14179043128628907, "rougeLsum_precision_stderr": 0.0018541893135933546, "rougeLsum_recall": 0.21137913675901987, "rougeLsum_recall_stderr": 0.0023233022426073892}}, "1": {"tldr_en": {"bleu": 1.566708990629026, "bleu_stderr": 0.0581496436272751, "rouge1_fmeasure": 0.1816842303684298, "rouge1_fmeasure_stderr": 0.0017782880793874537, "rouge1_precision": 0.17371296302390632, "rouge1_precision_stderr": 0.0021902383124749454, "rouge1_recall": 0.24147579886101558, "rouge1_recall_stderr": 0.0024751615706129063, "rouge2_fmeasure": 0.03265176701451356, "rouge2_fmeasure_stderr": 0.0007878736261592252, "rouge2_precision": 0.03192092546391988, "rouge2_precision_stderr": 0.0009424962628309825, "rouge2_recall": 0.04410602388358206, "rouge2_recall_stderr": 0.0011954069713593922, "rougeL_fmeasure": 0.13015162278257636, "rougeL_fmeasure_stderr": 0.0012020872378512297, "rougeL_precision": 0.12465533551452404, "rougeL_precision_stderr": 0.0015982129307706894, "rougeL_recall": 0.17675811341682113, "rougeL_recall_stderr": 0.0019268394653393782, "rougeLsum_fmeasure": 0.17077057715538618, "rougeLsum_fmeasure_stderr": 0.0016691467024742542, "rougeLsum_precision": 0.1631041776023868, "rougeLsum_precision_stderr": 0.0020525153232724904, "rougeLsum_recall": 0.22761644537805767, "rougeLsum_recall_stderr": 0.0023639550060386397}}, "2": {"tldr_en": {"bleu": 1.5566151429887363, "bleu_stderr": 0.07263045479067322, "rouge1_fmeasure": 0.18745443354388727, "rouge1_fmeasure_stderr": 0.0017296949460870405, "rouge1_precision": 0.17743624737565108, "rouge1_precision_stderr": 0.0021492258023722674, "rouge1_recall": 0.25150886158134367, "rouge1_recall_stderr": 0.0024524846458276782, "rouge2_fmeasure": 0.033509423859662844, "rouge2_fmeasure_stderr": 0.0007929018957245757, "rouge2_precision": 0.03283000534133716, "rouge2_precision_stderr": 0.0009328095980555773, "rouge2_recall": 0.045825393377754105, "rouge2_recall_stderr": 0.0012602521826330568, "rougeL_fmeasure": 0.1336204206295648, "rougeL_fmeasure_stderr": 0.0011901208386536995, "rougeL_precision": 0.12645353945710797, "rougeL_precision_stderr": 0.0015870180893584427, "rougeL_recall": 0.18352284038906627, "rougeL_recall_stderr": 0.0019514738060420578, "rougeLsum_fmeasure": 0.17608197313625737, "rougeLsum_fmeasure_stderr": 0.0016179873786064413, "rougeLsum_precision": 0.16653674072514268, "rougeLsum_precision_stderr": 0.002024987535804069, "rougeLsum_recall": 0.23696286031880665, "rougeLsum_recall_stderr": 0.002325990094088013}}, "3": {"tldr_en": {"bleu": 1.5090266791250284, "bleu_stderr": 0.06924033448041976, "rouge1_fmeasure": 0.15441643686495948, "rouge1_fmeasure_stderr": 0.0020001231144296736, "rouge1_precision": 0.14740810337408072, "rouge1_precision_stderr": 0.002271679945302172, "rouge1_recall": 0.20836892569223942, "rouge1_recall_stderr": 0.0028639121415319447, "rouge2_fmeasure": 0.02732982658717203, "rouge2_fmeasure_stderr": 0.0007317865399481251, "rouge2_precision": 0.026151374582378446, "rouge2_precision_stderr": 0.0007896206739810243, "rouge2_recall": 0.037574793035193066, "rouge2_recall_stderr": 0.0011612525965493635, "rougeL_fmeasure": 0.10993608037589384, "rougeL_fmeasure_stderr": 0.0013690145372151107, "rougeL_precision": 0.10492025586641264, "rougeL_precision_stderr": 0.0015968039001781839, "rougeL_recall": 0.15175102080784733, "rougeL_recall_stderr": 0.0021792866520934837, "rougeLsum_fmeasure": 0.14475462836497524, "rougeLsum_fmeasure_stderr": 0.0018689106719346205, "rougeLsum_precision": 0.13823688941444, "rougeLsum_precision_stderr": 0.002132419884185906, "rougeLsum_recall": 0.1956605692982594, "rougeLsum_recall_stderr": 0.002692622620180876}}, "4": {"tldr_en": {"bleu": 0.22270796928381564, "bleu_stderr": 0.029433615868403155, "rouge1_fmeasure": 0.050539802692113486, "rouge1_fmeasure_stderr": 0.0017469478379052526, "rouge1_precision": 0.049482797501199056, "rouge1_precision_stderr": 0.0019059242917520388, "rouge1_recall": 0.07028822776695906, "rouge1_recall_stderr": 0.002492820928227135, "rouge2_fmeasure": 0.009189516501593525, "rouge2_fmeasure_stderr": 0.0005049910178490766, "rouge2_precision": 0.009307183820869624, "rouge2_precision_stderr": 0.0005915386117685121, "rouge2_recall": 0.012698668080633723, "rouge2_recall_stderr": 0.0007466714930192209, "rougeL_fmeasure": 0.03691068397379973, "rougeL_fmeasure_stderr": 0.0012531679750741017, "rougeL_precision": 0.03621618955918932, "rougeL_precision_stderr": 0.00140538497956548, "rougeL_recall": 0.0526171116259514, "rougeL_recall_stderr": 0.0018954837026351507, "rougeLsum_fmeasure": 0.0471157693901415, "rougeLsum_fmeasure_stderr": 0.0016276260750980145, "rougeLsum_precision": 0.046090930054903605, "rougeLsum_precision_stderr": 0.0017742451276749082, "rougeLsum_recall": 0.0656234761466232, "rougeLsum_recall_stderr": 0.002326065080347693}}, "5": {"tldr_en": {"bleu": 3.997473456123696e-08, "bleu_stderr": 1.002855650120767e-07, "rouge1_fmeasure": 0.007351567651326997, "rouge1_fmeasure_stderr": 0.0007412176546731157, "rouge1_precision": 0.007478271052435213, "rouge1_precision_stderr": 0.0008063007869225007, "rouge1_recall": 0.010338951290674275, "rouge1_recall_stderr": 0.0010687996383989403, "rouge2_fmeasure": 0.0014450651061614851, "rouge2_fmeasure_stderr": 0.0002191123197517165, "rouge2_precision": 0.0013879834061599138, "rouge2_precision_stderr": 0.0002237907618586408, "rouge2_recall": 0.002245934397481068, "rouge2_recall_stderr": 0.00039931884660781176, "rougeL_fmeasure": 0.005480459085572166, "rougeL_fmeasure_stderr": 0.0005436419168699393, "rougeL_precision": 0.005604377982811, "rougeL_precision_stderr": 0.0006037717129781307, "rougeL_recall": 0.007942619745679938, "rougeL_recall_stderr": 0.0008436730401849616, "rougeLsum_fmeasure": 0.006967006053774628, "rougeLsum_fmeasure_stderr": 0.0007050533365556994, "rougeLsum_precision": 0.007131566619622942, "rougeLsum_precision_stderr": 0.0007759264592303796, "rougeLsum_recall": 0.009791040555433658, "rougeLsum_recall_stderr": 0.0010166014822588294}}}, "e2e_nlg_cleaned": {"0": {"generate_text_restaurant": {"bleu": 1.309497335599097, "bleu_stderr": 0.023324215467998514, "rouge1_fmeasure": 0.12101569116712643, "rouge1_fmeasure_stderr": 0.0018859465533766812, "rouge1_precision": 0.11928395058889167, "rouge1_precision_stderr": 0.0026720430430010717, "rouge1_recall": 0.16222047702577053, "rouge1_recall_stderr": 0.002573881001494484, "rouge2_fmeasure": 0.02190886095908555, "rouge2_fmeasure_stderr": 0.0007251164901007362, "rouge2_precision": 0.01996887174584161, "rouge2_precision_stderr": 0.0008462437123245745, "rouge2_recall": 0.02965977606050867, "rouge2_recall_stderr": 0.001033586571455221, "rougeL_fmeasure": 0.09561805145503208, "rougeL_fmeasure_stderr": 0.0014452773316927124, "rougeL_precision": 0.0972026278015815, "rougeL_precision_stderr": 0.0024157240054608615, "rougeL_recall": 0.1287653818656058, "rougeL_recall_stderr": 0.002033304125683539, "rougeLsum_fmeasure": 0.10772552310984851, "rougeLsum_fmeasure_stderr": 0.0016823465430055036, "rougeLsum_precision": 0.1075291758702482, "rougeLsum_precision_stderr": 0.0025162153224772906, "rougeLsum_recall": 0.14428075183193284, "rougeLsum_recall_stderr": 0.002300879817943218}}, "1": {"generate_text_restaurant": {"bleu": 7.230957749576389, "bleu_stderr": 0.0536425469915919, "rouge1_fmeasure": 0.3592817925524962, "rouge1_fmeasure_stderr": 0.0021198922639512987, "rouge1_precision": 0.34380888996516695, "rouge1_precision_stderr": 0.0030845076484356158, "rouge1_recall": 0.447391658162999, "rouge1_recall_stderr": 0.002727984781486933, "rouge2_fmeasure": 0.15054262500569862, "rouge2_fmeasure_stderr": 0.0015981728794968756, "rouge2_precision": 0.14545103598427403, "rouge2_precision_stderr": 0.0019947160057053256, "rouge2_recall": 0.18921875166954605, "rouge2_recall_stderr": 0.0020477910004319416, "rougeL_fmeasure": 0.2638992015247686, "rougeL_fmeasure_stderr": 0.0017193130894710778, "rougeL_precision": 0.2533789645650362, "rougeL_precision_stderr": 0.002514469484712738, "rougeL_recall": 0.33025523426001224, "rougeL_recall_stderr": 0.002291380183574316, "rougeLsum_fmeasure": 0.3053449527328775, "rougeLsum_fmeasure_stderr": 0.002014422999339484, "rougeLsum_precision": 0.2918162013801523, "rougeLsum_precision_stderr": 0.0027922449703006685, "rougeLsum_recall": 0.3811978300988754, "rougeLsum_recall_stderr": 0.0026251491058964013}}, "2": {"generate_text_restaurant": {"bleu": 11.80649360056355, "bleu_stderr": 0.1998199512362247, "rouge1_fmeasure": 0.4233941396922909, "rouge1_fmeasure_stderr": 0.002240259708210042, "rouge1_precision": 0.4618975292968109, "rouge1_precision_stderr": 0.0033374021778200306, "rouge1_recall": 0.44185113042812146, "rouge1_recall_stderr": 0.0027208355753659172, "rouge2_fmeasure": 0.19638166157139877, "rouge2_fmeasure_stderr": 0.0018136805158363019, "rouge2_precision": 0.21720316360476427, "rouge2_precision_stderr": 0.0023932535396076963, "rouge2_recall": 0.20548913402282043, "rouge2_recall_stderr": 0.0020643048503938386, "rougeL_fmeasure": 0.3159660620207397, "rougeL_fmeasure_stderr": 0.0019464502769911136, "rougeL_precision": 0.345686135545352, "rougeL_precision_stderr": 0.0028355066597269933, "rougeL_recall": 0.33044345883576104, "rougeL_recall_stderr": 0.0023468520325341962, "rougeLsum_fmeasure": 0.35940536059201766, "rougeLsum_fmeasure_stderr": 0.0021791205035671516, "rougeLsum_precision": 0.3920117254184558, "rougeLsum_precision_stderr": 0.0030921641172849523, "rougeLsum_recall": 0.3756316032841477, "rougeLsum_recall_stderr": 0.002600519205461284}}, "3": {"generate_text_restaurant": {"bleu": 12.91307719639215, "bleu_stderr": 0.1274857032754034, "rouge1_fmeasure": 0.43472700621860616, "rouge1_fmeasure_stderr": 0.0021930927799969995, "rouge1_precision": 0.4709595396963552, "rouge1_precision_stderr": 0.003227057457923827, "rouge1_recall": 0.44897994314565826, "rouge1_recall_stderr": 0.0026763988425963594, "rouge2_fmeasure": 0.2054392972212338, "rouge2_fmeasure_stderr": 0.0018449396852071784, "rouge2_precision": 0.2252611249009733, "rouge2_precision_stderr": 0.0023859573577785687, "rouge2_recall": 0.21265122060479416, "rouge2_recall_stderr": 0.002077181955257037, "rougeL_fmeasure": 0.32543991881376977, "rougeL_fmeasure_stderr": 0.0019275494986348497, "rougeL_precision": 0.35320392511807835, "rougeL_precision_stderr": 0.002743833223699648, "rougeL_recall": 0.33685020068084837, "rougeL_recall_stderr": 0.002328588288588858, "rougeLsum_fmeasure": 0.37211755259775925, "rougeLsum_fmeasure_stderr": 0.0021593105116151728, "rougeLsum_precision": 0.4032258158403475, "rougeLsum_precision_stderr": 0.0030346167857717155, "rougeLsum_recall": 0.3847176304718895, "rougeLsum_recall_stderr": 0.0025700421376888207}}, "4": {"generate_text_restaurant": {"bleu": 12.895073995415705, "bleu_stderr": 0.15213341614493073, "rouge1_fmeasure": 0.4358889598609801, "rouge1_fmeasure_stderr": 0.002183214874104859, "rouge1_precision": 0.4650093328987851, "rouge1_precision_stderr": 0.0031030240695590562, "rouge1_recall": 0.453603046375726, "rouge1_recall_stderr": 0.0026544370156289954, "rouge2_fmeasure": 0.2044223942588151, "rouge2_fmeasure_stderr": 0.0018593650607392539, "rouge2_precision": 0.21937912264430276, "rouge2_precision_stderr": 0.002277471884890991, "rouge2_recall": 0.21394671208363505, "rouge2_recall_stderr": 0.0021088970425982767, "rougeL_fmeasure": 0.3254926044349284, "rougeL_fmeasure_stderr": 0.0019460417013969558, "rougeL_precision": 0.34738539994213957, "rougeL_precision_stderr": 0.0026340554345153535, "rougeL_recall": 0.33972816863194827, "rougeL_recall_stderr": 0.002342079191640274, "rougeLsum_fmeasure": 0.37230138483200753, "rougeLsum_fmeasure_stderr": 0.002156573551629483, "rougeLsum_precision": 0.39726620076907726, "rougeLsum_precision_stderr": 0.0029189292625600117, "rougeLsum_recall": 0.3877392144856795, "rougeLsum_recall_stderr": 0.0025612577080022566}}, "5": {"generate_text_restaurant": {"bleu": 12.984249703645997, "bleu_stderr": 0.14605546972985659, "rouge1_fmeasure": 0.4394110300981441, "rouge1_fmeasure_stderr": 0.002155708933961789, "rouge1_precision": 0.4596711523135132, "rouge1_precision_stderr": 0.0030229942436052165, "rouge1_recall": 0.4626551599063747, "rouge1_recall_stderr": 0.0026402368817322257, "rouge2_fmeasure": 0.20837071123028594, "rouge2_fmeasure_stderr": 0.0018180763618672092, "rouge2_precision": 0.2193015904368128, "rouge2_precision_stderr": 0.0022187644166033974, "rouge2_recall": 0.22067796088896902, "rouge2_recall_stderr": 0.002098400156703052, "rougeL_fmeasure": 0.3268336987119632, "rougeL_fmeasure_stderr": 0.001906797734845931, "rougeL_precision": 0.3420249015987018, "rougeL_precision_stderr": 0.0025525295785147847, "rougeL_recall": 0.3451786358998491, "rougeL_recall_stderr": 0.0023314269399147035, "rougeLsum_fmeasure": 0.3762959528921545, "rougeLsum_fmeasure_stderr": 0.0021396018313958806, "rougeLsum_precision": 0.39378396094073, "rougeLsum_precision_stderr": 0.002858394052035071, "rougeLsum_recall": 0.3964808392544174, "rougeLsum_recall_stderr": 0.0025604225420971832}}}, "gem_xsum": {"0": {"article_DOC_summary": {"bleu": 0.997655025281657, "bleu_stderr": 0.08049545372158354, "rouge1_fmeasure": 0.17444657578502828, "rouge1_fmeasure_stderr": 0.0022844654329194137, "rouge1_precision": 0.12832828142164515, "rouge1_precision_stderr": 0.0017794562183186251, "rouge1_recall": 0.28847248029120043, "rouge1_recall_stderr": 0.003889108647255819, "rouge2_fmeasure": 0.029039326805435032, "rouge2_fmeasure_stderr": 0.0011554949380146165, "rouge2_precision": 0.021115950384362318, "rouge2_precision_stderr": 0.000843051310287779, "rouge2_recall": 0.04925763881619255, "rouge2_recall_stderr": 0.0020461456356515254, "rougeL_fmeasure": 0.12720258223547712, "rougeL_fmeasure_stderr": 0.001648248487654858, "rougeL_precision": 0.09350128038856384, "rougeL_precision_stderr": 0.0012793590377888806, "rougeL_recall": 0.21105922988342335, "rougeL_recall_stderr": 0.0028651027111890855, "rougeLsum_fmeasure": 0.1390205462262644, "rougeLsum_fmeasure_stderr": 0.001823510668675631, "rougeLsum_precision": 0.10200423853654914, "rougeLsum_precision_stderr": 0.0013916696816987264, "rougeLsum_recall": 0.2313753113336317, "rougeLsum_recall_stderr": 0.0032368664660586965}}, "1": {"article_DOC_summary": {"bleu": 0.9675071405690926, "bleu_stderr": 0.09958935593288926, "rouge1_fmeasure": 0.17768393062360832, "rouge1_fmeasure_stderr": 0.0022349506141921644, "rouge1_precision": 0.1309454764999026, "rouge1_precision_stderr": 0.001827765049519732, "rouge1_recall": 0.29700562382894197, "rouge1_recall_stderr": 0.003795399616335189, "rouge2_fmeasure": 0.027990512381062316, "rouge2_fmeasure_stderr": 0.001130566656515218, "rouge2_precision": 0.02041569980816869, "rouge2_precision_stderr": 0.0008450735436051835, "rouge2_recall": 0.04822240605480935, "rouge2_recall_stderr": 0.0019777747068750423, "rougeL_fmeasure": 0.1288738749109626, "rougeL_fmeasure_stderr": 0.001625277139920424, "rougeL_precision": 0.09504020604087868, "rougeL_precision_stderr": 0.0013599947712725539, "rougeL_recall": 0.2162072871160676, "rougeL_recall_stderr": 0.002829869659329609, "rougeLsum_fmeasure": 0.14046128881678455, "rougeLsum_fmeasure_stderr": 0.0017990331974292878, "rougeLsum_precision": 0.10335621277254586, "rougeLsum_precision_stderr": 0.001462699625038698, "rougeLsum_recall": 0.23614329439124435, "rougeLsum_recall_stderr": 0.0031713690732049172}}, "2": {"article_DOC_summary": {"bleu": 1.0366131861525387, "bleu_stderr": 0.08607955425699379, "rouge1_fmeasure": 0.1815853317619735, "rouge1_fmeasure_stderr": 0.0022198474125888993, "rouge1_precision": 0.13326231738564168, "rouge1_precision_stderr": 0.0018541538731038265, "rouge1_recall": 0.30653846845415633, "rouge1_recall_stderr": 0.003718784510021167, "rouge2_fmeasure": 0.030561262010519005, "rouge2_fmeasure_stderr": 0.0011776564417043847, "rouge2_precision": 0.022289828836057894, "rouge2_precision_stderr": 0.0008725918092828604, "rouge2_recall": 0.05259029448210306, "rouge2_recall_stderr": 0.0021143622321714616, "rougeL_fmeasure": 0.13099347768064226, "rougeL_fmeasure_stderr": 0.0015774167795458336, "rougeL_precision": 0.09606073585619543, "rougeL_precision_stderr": 0.001320735780400149, "rougeL_recall": 0.2222896298147904, "rougeL_recall_stderr": 0.0027767376278209476, "rougeLsum_fmeasure": 0.14421468208543237, "rougeLsum_fmeasure_stderr": 0.001795033812855214, "rougeLsum_precision": 0.105504826402108, "rougeLsum_precision_stderr": 0.0014517045288292944, "rougeLsum_recall": 0.24526632623966604, "rougeLsum_recall_stderr": 0.0031905602481124952}}, "3": {"article_DOC_summary": {"bleu": 1.0158973292814215, "bleu_stderr": 0.11093743610635416, "rouge1_fmeasure": 0.17299896718015717, "rouge1_fmeasure_stderr": 0.0024005443718459487, "rouge1_precision": 0.12940832070901992, "rouge1_precision_stderr": 0.0019943586762260035, "rouge1_recall": 0.2884068479099661, "rouge1_recall_stderr": 0.004068894100326392, "rouge2_fmeasure": 0.02723037446755515, "rouge2_fmeasure_stderr": 0.0011161293152371049, "rouge2_precision": 0.020122251087519527, "rouge2_precision_stderr": 0.0008493738964290155, "rouge2_recall": 0.0463800028049885, "rouge2_recall_stderr": 0.0019308344795767856, "rougeL_fmeasure": 0.1247856962494059, "rougeL_fmeasure_stderr": 0.0016915785603912935, "rougeL_precision": 0.09345653613534448, "rougeL_precision_stderr": 0.00145180399823862, "rougeL_recall": 0.2091744165096173, "rougeL_recall_stderr": 0.0029753866994255977, "rougeLsum_fmeasure": 0.13664310066002217, "rougeLsum_fmeasure_stderr": 0.0019261086832577496, "rougeLsum_precision": 0.10212955921043831, "rougeLsum_precision_stderr": 0.0016013787895265638, "rougeLsum_recall": 0.2290005827276144, "rougeLsum_recall_stderr": 0.0033599851151365936}}, "4": {"article_DOC_summary": {"bleu": 0.5019536886003719, "bleu_stderr": 0.1343611351129069, "rouge1_fmeasure": 0.04539068876881627, "rouge1_fmeasure_stderr": 0.002529463308822854, "rouge1_precision": 0.0373879533361559, "rouge1_precision_stderr": 0.0021810464397006403, "rouge1_recall": 0.07150811812236044, "rouge1_recall_stderr": 0.004101431121761528, "rouge2_fmeasure": 0.007032145297330701, "rouge2_fmeasure_stderr": 0.0006749391536461736, "rouge2_precision": 0.005550765385729703, "rouge2_precision_stderr": 0.0005963003468727854, "rouge2_recall": 0.011310401420282012, "rouge2_recall_stderr": 0.0010721548649813347, "rougeL_fmeasure": 0.03322213103634567, "rougeL_fmeasure_stderr": 0.0018345484180096144, "rougeL_precision": 0.0280016015013484, "rougeL_precision_stderr": 0.0017038515915968166, "rougeL_recall": 0.05214073374869573, "rougeL_recall_stderr": 0.0029695500586895698, "rougeLsum_fmeasure": 0.03607224322510311, "rougeLsum_fmeasure_stderr": 0.0020071211692870355, "rougeLsum_precision": 0.03019679894521189, "rougeLsum_precision_stderr": 0.0018216600106999053, "rougeLsum_recall": 0.05685075214207904, "rougeLsum_recall_stderr": 0.0032708994661166087}}, "5": {"article_DOC_summary": {"bleu": 1.0120083486806341e-43, "bleu_stderr": 2.299599307531863e-38, "rouge1_fmeasure": 0.001950949795538486, "rouge1_fmeasure_stderr": 0.0005800061914629863, "rouge1_precision": 0.0023010225042523016, "rouge1_precision_stderr": 0.0007056279408099138, "rouge1_recall": 0.0017639670878076587, "rouge1_recall_stderr": 0.0005179713630676667, "rouge2_fmeasure": 0.0, "rouge2_fmeasure_stderr": 0.0, "rouge2_precision": 0.0, "rouge2_precision_stderr": 0.0, "rouge2_recall": 0.0, "rouge2_recall_stderr": 0.0, "rougeL_fmeasure": 0.0014822281925852424, "rougeL_fmeasure_stderr": 0.0004217162689453353, "rougeL_precision": 0.001755708684944675, "rougeL_precision_stderr": 0.000517656162281774, "rougeL_recall": 0.001338960546022285, "rougeL_recall_stderr": 0.00037496082953111386, "rougeLsum_fmeasure": 0.001529874466646611, "rougeLsum_fmeasure_stderr": 0.00043483560412767216, "rougeLsum_precision": 0.001800847260371234, "rougeLsum_precision_stderr": 0.0005272819939622312, "rougeLsum_recall": 0.0013894095420872634, "rougeLsum_recall_stderr": 0.00039142547685255293}}}} \ No newline at end of file diff --git a/4b284b1b9oscar/evaluation/generation/slim.4b284b1b9oscar_GEM-web_nlg_en_PALM_prompt_0.json b/4b284b1b9oscar/evaluation/generation/slim.4b284b1b9oscar_GEM-web_nlg_en_PALM_prompt_0.json new file mode 100644 index 0000000000000000000000000000000000000000..12a908bf1ed2625a57241559271f694832988b3f --- /dev/null +++ b/4b284b1b9oscar/evaluation/generation/slim.4b284b1b9oscar_GEM-web_nlg_en_PALM_prompt_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.3035990566203564, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.025090566187709752 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.071329758776339, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.00279942361165936 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.2777833537640477, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.005021363310584012 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.08651516220636073, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0018421075247631034 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.02493593159722908, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0015907952635559632 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.09479553172438937, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0029506060980076265 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.029457430490114032, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0010438331217221088 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.06175148366384243, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.002527555333736909 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.2437824603111534, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004509160724470269 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.07406437697939146, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0015395345437139562 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.06515539016564718, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0025912111251545702 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.2540442770643496, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.00462671195388165 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.07865092467105374, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0016703135405487922 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-repetitions/4b284b1b9oscar/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9oscar/evaluation/generation/slim.4b284b1b9oscar_GEM-web_nlg_en_PALM_prompt_1.json b/4b284b1b9oscar/evaluation/generation/slim.4b284b1b9oscar_GEM-web_nlg_en_PALM_prompt_1.json new file mode 100644 index 0000000000000000000000000000000000000000..e4db207adf3b6f338eccf5c5ad3ff0a1c48647c2 --- /dev/null +++ b/4b284b1b9oscar/evaluation/generation/slim.4b284b1b9oscar_GEM-web_nlg_en_PALM_prompt_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.425747629657599, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.019098717536100474 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.07869000641860335, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.002574141434973694 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.27911697917731965, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.005025828797632534 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.09915747457632551, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0020735345455021683 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.028711039922457098, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0015895748345510915 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.1016349747426781, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.003064263260383757 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.03553245669340435, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0012297768666432714 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.06784822137078164, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0023584286957804 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.24104415879973046, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004392721456408033 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.08430815534591073, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.001735358065989058 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.07247904169290792, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.002450321126322307 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.25603235118880574, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004615086249365793 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.09052335683054723, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.00188465696521615 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-repetitions/4b284b1b9oscar/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9oscar/evaluation/generation/slim.4b284b1b9oscar_GEM-web_nlg_en_PALM_prompt_2.json b/4b284b1b9oscar/evaluation/generation/slim.4b284b1b9oscar_GEM-web_nlg_en_PALM_prompt_2.json new file mode 100644 index 0000000000000000000000000000000000000000..6c7744b93af3c4cf283823532f5cc6164952f2a7 --- /dev/null +++ b/4b284b1b9oscar/evaluation/generation/slim.4b284b1b9oscar_GEM-web_nlg_en_PALM_prompt_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.4497583704772655, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.020681936257570407 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.08676474022374367, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0030356563200589527 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.28565036099040625, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.005160364852348898 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.10711351422120703, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0024517943039154802 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.03205343730461677, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.001723196140481487 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.10665226766319001, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0031321051228955267 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.03910067067467762, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0014210269756776363 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.07292425907812133, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.002682288331233897 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.2418993456910343, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004387413324828132 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.08897314932870945, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.002002929328501285 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.07776458484873876, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.002744825042381609 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.25905556991925294, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004682330002575584 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.09589616680302177, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0021426419270798853 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-repetitions/4b284b1b9oscar/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9oscar/evaluation/generation/slim.4b284b1b9oscar_GEM-web_nlg_en_PALM_prompt_3.json b/4b284b1b9oscar/evaluation/generation/slim.4b284b1b9oscar_GEM-web_nlg_en_PALM_prompt_3.json new file mode 100644 index 0000000000000000000000000000000000000000..e90fddc4df36d05886dcbcefd1181b19f779c590 --- /dev/null +++ b/4b284b1b9oscar/evaluation/generation/slim.4b284b1b9oscar_GEM-web_nlg_en_PALM_prompt_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.5453566942766312, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.03174339868079995 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.09141520582826082, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0030271528036140147 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.2946460917400917, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.005150457597998139 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.11381502730552777, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0025266791277412273 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.0349533732864018, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0018089338825247128 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.1132672221907378, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0032322633657986535 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.04302598363295129, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0015803110546547487 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.07724838020684321, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0027324213899579644 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.24881404393817505, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004406171113605123 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.09476653245926525, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.002130119160105199 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.0833829754674534, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0028479312887177617 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.26789842816421516, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.00469224168355405 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.10301268965900799, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0022888513790911423 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-repetitions/4b284b1b9oscar/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9oscar/evaluation/generation/slim.4b284b1b9oscar_GEM-web_nlg_en_PALM_prompt_4.json b/4b284b1b9oscar/evaluation/generation/slim.4b284b1b9oscar_GEM-web_nlg_en_PALM_prompt_4.json new file mode 100644 index 0000000000000000000000000000000000000000..9913f99e03ede74495b381e1f511866643b9c218 --- /dev/null +++ b/4b284b1b9oscar/evaluation/generation/slim.4b284b1b9oscar_GEM-web_nlg_en_PALM_prompt_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.552842738936437, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.031220316118742313 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.0904044344997309, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0028870247747819445 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.30097906504674915, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.005237112327131232 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.1125896095390658, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0024441626752801536 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.03357915742500351, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.001563192087212674 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.1186975703608361, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0033758949815214734 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.042594714406787165, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0014574874865349483 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.07544711584950896, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0025299603142831984 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.2529660247399177, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.00445147947055177 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.09294924226115779, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.00201851881067649 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.08174948336092744, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0026566402566456145 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.2733792203624409, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0047675031230854 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.10127472230162189, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.002166709168455675 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-repetitions/4b284b1b9oscar/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9oscar/evaluation/generation/slim.4b284b1b9oscar_GEM-web_nlg_en_PALM_prompt_5.json b/4b284b1b9oscar/evaluation/generation/slim.4b284b1b9oscar_GEM-web_nlg_en_PALM_prompt_5.json new file mode 100644 index 0000000000000000000000000000000000000000..a5ba06acf21e85d1f24fea91c931140733745c58 --- /dev/null +++ b/4b284b1b9oscar/evaluation/generation/slim.4b284b1b9oscar_GEM-web_nlg_en_PALM_prompt_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.5160808451457419, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.028152585581808363 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.08756298477917958, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.002702960483622272 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.30943226003927954, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.00537568452081882 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.11267246257206415, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0023161203363087435 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.031279144513968335, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0015413777797901 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.1215282455226915, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.003458287142794445 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.04130600915194189, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0014050088099057468 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.0727149677685351, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.002357535066892359 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.25979581419981984, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004554297207344822 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.09293487391814521, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0018937867038700312 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.07890883384983154, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.002452737865418059 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.28252744959181614, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004927414464655944 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.10164495184500182, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0020419190457151644 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-repetitions/4b284b1b9oscar/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9oscar/evaluation/generation/slim.4b284b1b9oscar_GEM-wiki_lingua_en_tldr_en_0.json b/4b284b1b9oscar/evaluation/generation/slim.4b284b1b9oscar_GEM-wiki_lingua_en_tldr_en_0.json new file mode 100644 index 0000000000000000000000000000000000000000..80af18735d9b1e894ca4f4c966c3015874da600b --- /dev/null +++ b/4b284b1b9oscar/evaluation/generation/slim.4b284b1b9oscar_GEM-wiki_lingua_en_tldr_en_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.15144825263093634, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.001983783278782952 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.22534109695497295, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.002481691416374552 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.16612440507868828, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0017714330657529222 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.024905925069722477, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0006850846534012076 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.03850478234485377, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0011024526272317378 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.027643924254134603, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0007121708145651539 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.11125836759667614, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.00142424299423556 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.17033205247937977, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0019231978134307691 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.12276816133742628, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0012192289120582331 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.14179043128628907, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0018541893135933546 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.21137913675901987, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0023233022426073892 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.15558334623949294, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0016443580462993418 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 1.159384502447796, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.057628180591426645 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-repetitions/4b284b1b9oscar/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9oscar/evaluation/generation/slim.4b284b1b9oscar_GEM-wiki_lingua_en_tldr_en_1.json b/4b284b1b9oscar/evaluation/generation/slim.4b284b1b9oscar_GEM-wiki_lingua_en_tldr_en_1.json new file mode 100644 index 0000000000000000000000000000000000000000..907e85e297e295f9023d676e21cf525f32361fee --- /dev/null +++ b/4b284b1b9oscar/evaluation/generation/slim.4b284b1b9oscar_GEM-wiki_lingua_en_tldr_en_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.17371296302390632, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0021902383124749454 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.24147579886101558, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0024751615706129063 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.1816842303684298, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0017782880793874537 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.03192092546391988, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0009424962628309825 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.04410602388358206, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0011954069713593922 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.03265176701451356, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0007878736261592252 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.12465533551452404, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0015982129307706894 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.17675811341682113, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0019268394653393782 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.13015162278257636, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0012020872378512297 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.1631041776023868, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0020525153232724904 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.22761644537805767, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0023639550060386397 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.17077057715538618, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0016691467024742542 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 1.566708990629026, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.0581496436272751 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-repetitions/4b284b1b9oscar/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9oscar/evaluation/generation/slim.4b284b1b9oscar_GEM-wiki_lingua_en_tldr_en_2.json b/4b284b1b9oscar/evaluation/generation/slim.4b284b1b9oscar_GEM-wiki_lingua_en_tldr_en_2.json new file mode 100644 index 0000000000000000000000000000000000000000..9d32acc85454eaf4e116aa9429d3c761ad0610d4 --- /dev/null +++ b/4b284b1b9oscar/evaluation/generation/slim.4b284b1b9oscar_GEM-wiki_lingua_en_tldr_en_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.17743624737565108, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0021492258023722674 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.25150886158134367, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0024524846458276782 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.18745443354388727, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0017296949460870405 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.03283000534133716, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0009328095980555773 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.045825393377754105, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0012602521826330568 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.033509423859662844, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0007929018957245757 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.12645353945710797, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0015870180893584427 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.18352284038906627, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0019514738060420578 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.1336204206295648, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0011901208386536995 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.16653674072514268, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.002024987535804069 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.23696286031880665, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.002325990094088013 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.17608197313625737, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0016179873786064413 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 1.5566151429887363, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.07263045479067322 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-repetitions/4b284b1b9oscar/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9oscar/evaluation/generation/slim.4b284b1b9oscar_GEM-wiki_lingua_en_tldr_en_3.json b/4b284b1b9oscar/evaluation/generation/slim.4b284b1b9oscar_GEM-wiki_lingua_en_tldr_en_3.json new file mode 100644 index 0000000000000000000000000000000000000000..71d90c685181a1c3de1eb8cc299775a62e5065f8 --- /dev/null +++ b/4b284b1b9oscar/evaluation/generation/slim.4b284b1b9oscar_GEM-wiki_lingua_en_tldr_en_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.14740810337408072, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.002271679945302172 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.20836892569223942, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0028639121415319447 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.15441643686495948, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0020001231144296736 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.026151374582378446, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0007896206739810243 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.037574793035193066, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0011612525965493635 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.02732982658717203, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0007317865399481251 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.10492025586641264, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0015968039001781839 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.15175102080784733, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0021792866520934837 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.10993608037589384, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0013690145372151107 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.13823688941444, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.002132419884185906 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.1956605692982594, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.002692622620180876 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.14475462836497524, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0018689106719346205 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 1.5090266791250284, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.06924033448041976 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-repetitions/4b284b1b9oscar/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9oscar/evaluation/generation/slim.4b284b1b9oscar_GEM-wiki_lingua_en_tldr_en_4.json b/4b284b1b9oscar/evaluation/generation/slim.4b284b1b9oscar_GEM-wiki_lingua_en_tldr_en_4.json new file mode 100644 index 0000000000000000000000000000000000000000..ff6553c182b94da69e990cc95695c1a78dafeeae --- /dev/null +++ b/4b284b1b9oscar/evaluation/generation/slim.4b284b1b9oscar_GEM-wiki_lingua_en_tldr_en_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.049482797501199056, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0019059242917520388 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.07028822776695906, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.002492820928227135 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.050539802692113486, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0017469478379052526 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.009307183820869624, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0005915386117685121 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.012698668080633723, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0007466714930192209 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.009189516501593525, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0005049910178490766 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.03621618955918932, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.00140538497956548 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.0526171116259514, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0018954837026351507 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.03691068397379973, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0012531679750741017 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.046090930054903605, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0017742451276749082 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.0656234761466232, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.002326065080347693 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.0471157693901415, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0016276260750980145 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 0.22270796928381564, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.029433615868403155 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-repetitions/4b284b1b9oscar/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9oscar/evaluation/generation/slim.4b284b1b9oscar_GEM-wiki_lingua_en_tldr_en_5.json b/4b284b1b9oscar/evaluation/generation/slim.4b284b1b9oscar_GEM-wiki_lingua_en_tldr_en_5.json new file mode 100644 index 0000000000000000000000000000000000000000..928f836e0d1a5f3fb902dced2a74ee31281f9b2c --- /dev/null +++ b/4b284b1b9oscar/evaluation/generation/slim.4b284b1b9oscar_GEM-wiki_lingua_en_tldr_en_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.007478271052435213, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0008063007869225007 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.010338951290674275, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0010687996383989403 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.007351567651326997, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0007412176546731157 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.0013879834061599138, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0002237907618586408 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.002245934397481068, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.00039931884660781176 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.0014450651061614851, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0002191123197517165 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.005604377982811, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0006037717129781307 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.007942619745679938, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0008436730401849616 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.005480459085572166, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0005436419168699393 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.007131566619622942, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0007759264592303796 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.009791040555433658, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0010166014822588294 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.006967006053774628, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0007050533365556994 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 3.997473456123696e-08, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 1.002855650120767e-07 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-repetitions/4b284b1b9oscar/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9oscar/evaluation/generation/slim.4b284b1b9oscar_e2e_nlg_cleaned_generate_text_restaurant_0.json b/4b284b1b9oscar/evaluation/generation/slim.4b284b1b9oscar_e2e_nlg_cleaned_generate_text_restaurant_0.json new file mode 100644 index 0000000000000000000000000000000000000000..c1e9f6c011fbdd04e44a6299eac4f1139674cf2a --- /dev/null +++ b/4b284b1b9oscar/evaluation/generation/slim.4b284b1b9oscar_e2e_nlg_cleaned_generate_text_restaurant_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 1.309497335599097, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.023324215467998514 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.11928395058889167, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0026720430430010717 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.16222047702577053, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.002573881001494484 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.12101569116712643, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0018859465533766812 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.01996887174584161, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0008462437123245745 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.02965977606050867, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.001033586571455221 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.02190886095908555, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0007251164901007362 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.0972026278015815, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0024157240054608615 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.1287653818656058, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.002033304125683539 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.09561805145503208, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0014452773316927124 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.1075291758702482, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0025162153224772906 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.14428075183193284, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.002300879817943218 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.10772552310984851, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0016823465430055036 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-repetitions/4b284b1b9oscar/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9oscar/evaluation/generation/slim.4b284b1b9oscar_e2e_nlg_cleaned_generate_text_restaurant_1.json b/4b284b1b9oscar/evaluation/generation/slim.4b284b1b9oscar_e2e_nlg_cleaned_generate_text_restaurant_1.json new file mode 100644 index 0000000000000000000000000000000000000000..91ba471431b0d98b5861b59f5e9686c1c57c953d --- /dev/null +++ b/4b284b1b9oscar/evaluation/generation/slim.4b284b1b9oscar_e2e_nlg_cleaned_generate_text_restaurant_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 7.230957749576389, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.0536425469915919 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.34380888996516695, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0030845076484356158 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.447391658162999, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.002727984781486933 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.3592817925524962, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0021198922639512987 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.14545103598427403, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0019947160057053256 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.18921875166954605, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0020477910004319416 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.15054262500569862, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0015981728794968756 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.2533789645650362, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.002514469484712738 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.33025523426001224, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.002291380183574316 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.2638992015247686, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0017193130894710778 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.2918162013801523, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0027922449703006685 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.3811978300988754, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0026251491058964013 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.3053449527328775, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.002014422999339484 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-repetitions/4b284b1b9oscar/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9oscar/evaluation/generation/slim.4b284b1b9oscar_e2e_nlg_cleaned_generate_text_restaurant_2.json b/4b284b1b9oscar/evaluation/generation/slim.4b284b1b9oscar_e2e_nlg_cleaned_generate_text_restaurant_2.json new file mode 100644 index 0000000000000000000000000000000000000000..735fc8a5b44a0ce4c507bcca483d654a70b60f3b --- /dev/null +++ b/4b284b1b9oscar/evaluation/generation/slim.4b284b1b9oscar_e2e_nlg_cleaned_generate_text_restaurant_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 11.80649360056355, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.1998199512362247 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.4618975292968109, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0033374021778200306 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.44185113042812146, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0027208355753659172 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.4233941396922909, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.002240259708210042 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.21720316360476427, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0023932535396076963 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.20548913402282043, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0020643048503938386 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.19638166157139877, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0018136805158363019 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.345686135545352, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0028355066597269933 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.33044345883576104, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0023468520325341962 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.3159660620207397, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0019464502769911136 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.3920117254184558, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0030921641172849523 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.3756316032841477, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.002600519205461284 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.35940536059201766, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0021791205035671516 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-repetitions/4b284b1b9oscar/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9oscar/evaluation/generation/slim.4b284b1b9oscar_e2e_nlg_cleaned_generate_text_restaurant_3.json b/4b284b1b9oscar/evaluation/generation/slim.4b284b1b9oscar_e2e_nlg_cleaned_generate_text_restaurant_3.json new file mode 100644 index 0000000000000000000000000000000000000000..58a85f0ebfe1825f1f141e364979fb4e638443d2 --- /dev/null +++ b/4b284b1b9oscar/evaluation/generation/slim.4b284b1b9oscar_e2e_nlg_cleaned_generate_text_restaurant_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 12.91307719639215, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.1274857032754034 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.4709595396963552, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.003227057457923827 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.44897994314565826, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0026763988425963594 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.43472700621860616, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0021930927799969995 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.2252611249009733, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0023859573577785687 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.21265122060479416, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.002077181955257037 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.2054392972212338, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0018449396852071784 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.35320392511807835, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.002743833223699648 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.33685020068084837, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.002328588288588858 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.32543991881376977, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0019275494986348497 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.4032258158403475, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0030346167857717155 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.3847176304718895, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0025700421376888207 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.37211755259775925, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0021593105116151728 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-repetitions/4b284b1b9oscar/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9oscar/evaluation/generation/slim.4b284b1b9oscar_e2e_nlg_cleaned_generate_text_restaurant_4.json b/4b284b1b9oscar/evaluation/generation/slim.4b284b1b9oscar_e2e_nlg_cleaned_generate_text_restaurant_4.json new file mode 100644 index 0000000000000000000000000000000000000000..02b2d6978b868830178da39335e0fc963551ae17 --- /dev/null +++ b/4b284b1b9oscar/evaluation/generation/slim.4b284b1b9oscar_e2e_nlg_cleaned_generate_text_restaurant_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 12.895073995415705, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.15213341614493073 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.4650093328987851, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0031030240695590562 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.453603046375726, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0026544370156289954 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.4358889598609801, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.002183214874104859 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.21937912264430276, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.002277471884890991 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.21394671208363505, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0021088970425982767 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.2044223942588151, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0018593650607392539 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.34738539994213957, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0026340554345153535 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.33972816863194827, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.002342079191640274 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.3254926044349284, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0019460417013969558 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.39726620076907726, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0029189292625600117 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.3877392144856795, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0025612577080022566 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.37230138483200753, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.002156573551629483 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-repetitions/4b284b1b9oscar/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9oscar/evaluation/generation/slim.4b284b1b9oscar_e2e_nlg_cleaned_generate_text_restaurant_5.json b/4b284b1b9oscar/evaluation/generation/slim.4b284b1b9oscar_e2e_nlg_cleaned_generate_text_restaurant_5.json new file mode 100644 index 0000000000000000000000000000000000000000..2a9913b4dcc3a28304e0d22023723d202091267e --- /dev/null +++ b/4b284b1b9oscar/evaluation/generation/slim.4b284b1b9oscar_e2e_nlg_cleaned_generate_text_restaurant_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 12.984249703645997, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.14605546972985659 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.4596711523135132, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0030229942436052165 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.4626551599063747, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0026402368817322257 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.4394110300981441, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.002155708933961789 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.2193015904368128, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0022187644166033974 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.22067796088896902, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.002098400156703052 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.20837071123028594, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0018180763618672092 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.3420249015987018, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0025525295785147847 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.3451786358998491, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0023314269399147035 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.3268336987119632, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.001906797734845931 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.39378396094073, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.002858394052035071 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.3964808392544174, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0025604225420971832 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.3762959528921545, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0021396018313958806 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-repetitions/4b284b1b9oscar/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9oscar/evaluation/generation/slim.4b284b1b9oscar_gem_xsum_article_DOC_summary_0.json b/4b284b1b9oscar/evaluation/generation/slim.4b284b1b9oscar_gem_xsum_article_DOC_summary_0.json new file mode 100644 index 0000000000000000000000000000000000000000..e340491baf0ebfd64ebd330cacb1687a588a31a8 --- /dev/null +++ b/4b284b1b9oscar/evaluation/generation/slim.4b284b1b9oscar_gem_xsum_article_DOC_summary_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.12832828142164515, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0017794562183186251 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.28847248029120043, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.003889108647255819 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.17444657578502828, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0022844654329194137 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.021115950384362318, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.000843051310287779 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.04925763881619255, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0020461456356515254 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.029039326805435032, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0011554949380146165 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.09350128038856384, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0012793590377888806 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.21105922988342335, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0028651027111890855 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.12720258223547712, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.001648248487654858 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.10200423853654914, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0013916696816987264 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.2313753113336317, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0032368664660586965 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.1390205462262644, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.001823510668675631 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 0.997655025281657, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.08049545372158354 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-repetitions/4b284b1b9oscar/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9oscar/evaluation/generation/slim.4b284b1b9oscar_gem_xsum_article_DOC_summary_1.json b/4b284b1b9oscar/evaluation/generation/slim.4b284b1b9oscar_gem_xsum_article_DOC_summary_1.json new file mode 100644 index 0000000000000000000000000000000000000000..ed5a8615ed709f4bf9fc514dc76b4053e2a96353 --- /dev/null +++ b/4b284b1b9oscar/evaluation/generation/slim.4b284b1b9oscar_gem_xsum_article_DOC_summary_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.1309454764999026, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.001827765049519732 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.29700562382894197, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.003795399616335189 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.17768393062360832, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0022349506141921644 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.02041569980816869, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0008450735436051835 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.04822240605480935, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0019777747068750423 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.027990512381062316, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.001130566656515218 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.09504020604087868, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0013599947712725539 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.2162072871160676, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.002829869659329609 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.1288738749109626, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.001625277139920424 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.10335621277254586, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.001462699625038698 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.23614329439124435, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0031713690732049172 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.14046128881678455, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0017990331974292878 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 0.9675071405690926, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.09958935593288926 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-repetitions/4b284b1b9oscar/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9oscar/evaluation/generation/slim.4b284b1b9oscar_gem_xsum_article_DOC_summary_2.json b/4b284b1b9oscar/evaluation/generation/slim.4b284b1b9oscar_gem_xsum_article_DOC_summary_2.json new file mode 100644 index 0000000000000000000000000000000000000000..59df6502cc472c8000e92feaf86adb44fe6da1b1 --- /dev/null +++ b/4b284b1b9oscar/evaluation/generation/slim.4b284b1b9oscar_gem_xsum_article_DOC_summary_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.13326231738564168, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0018541538731038265 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.30653846845415633, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.003718784510021167 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.1815853317619735, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0022198474125888993 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.022289828836057894, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0008725918092828604 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.05259029448210306, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0021143622321714616 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.030561262010519005, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0011776564417043847 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.09606073585619543, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.001320735780400149 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.2222896298147904, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0027767376278209476 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.13099347768064226, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0015774167795458336 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.105504826402108, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0014517045288292944 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.24526632623966604, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0031905602481124952 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.14421468208543237, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.001795033812855214 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 1.0366131861525387, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.08607955425699379 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-repetitions/4b284b1b9oscar/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9oscar/evaluation/generation/slim.4b284b1b9oscar_gem_xsum_article_DOC_summary_3.json b/4b284b1b9oscar/evaluation/generation/slim.4b284b1b9oscar_gem_xsum_article_DOC_summary_3.json new file mode 100644 index 0000000000000000000000000000000000000000..7fbfb9824c5bdfd03e651075d62439b518de7f15 --- /dev/null +++ b/4b284b1b9oscar/evaluation/generation/slim.4b284b1b9oscar_gem_xsum_article_DOC_summary_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.12940832070901992, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0019943586762260035 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.2884068479099661, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.004068894100326392 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.17299896718015717, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0024005443718459487 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.020122251087519527, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0008493738964290155 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.0463800028049885, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0019308344795767856 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.02723037446755515, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0011161293152371049 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.09345653613534448, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.00145180399823862 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.2091744165096173, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0029753866994255977 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.1247856962494059, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0016915785603912935 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.10212955921043831, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0016013787895265638 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.2290005827276144, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0033599851151365936 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.13664310066002217, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0019261086832577496 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 1.0158973292814215, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.11093743610635416 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-repetitions/4b284b1b9oscar/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9oscar/evaluation/generation/slim.4b284b1b9oscar_gem_xsum_article_DOC_summary_4.json b/4b284b1b9oscar/evaluation/generation/slim.4b284b1b9oscar_gem_xsum_article_DOC_summary_4.json new file mode 100644 index 0000000000000000000000000000000000000000..3db1414daf1d0d117cae3fadac51552b2cd12e12 --- /dev/null +++ b/4b284b1b9oscar/evaluation/generation/slim.4b284b1b9oscar_gem_xsum_article_DOC_summary_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.0373879533361559, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0021810464397006403 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.07150811812236044, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.004101431121761528 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.04539068876881627, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.002529463308822854 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.005550765385729703, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0005963003468727854 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.011310401420282012, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0010721548649813347 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.007032145297330701, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0006749391536461736 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.0280016015013484, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0017038515915968166 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.05214073374869573, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0029695500586895698 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.03322213103634567, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0018345484180096144 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.03019679894521189, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0018216600106999053 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.05685075214207904, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0032708994661166087 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.03607224322510311, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0020071211692870355 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 0.5019536886003719, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.1343611351129069 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-repetitions/4b284b1b9oscar/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9oscar/evaluation/generation/slim.4b284b1b9oscar_gem_xsum_article_DOC_summary_5.json b/4b284b1b9oscar/evaluation/generation/slim.4b284b1b9oscar_gem_xsum_article_DOC_summary_5.json new file mode 100644 index 0000000000000000000000000000000000000000..9302b6b597ded80ce143ab3429ee3de7414cdf8d --- /dev/null +++ b/4b284b1b9oscar/evaluation/generation/slim.4b284b1b9oscar_gem_xsum_article_DOC_summary_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.0023010225042523016, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0007056279408099138 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.0017639670878076587, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.0005179713630676667 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.001950949795538486, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0005800061914629863 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.0, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.0, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.0, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.001755708684944675, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.000517656162281774 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.001338960546022285, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.00037496082953111386 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.0014822281925852424, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0004217162689453353 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.001800847260371234, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0005272819939622312 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.0013894095420872634, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.00039142547685255293 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.001529874466646611, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.00043483560412767216 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 1.0120083486806341e-43, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 2.299599307531863e-38 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-repetitions/4b284b1b9oscar/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9oscar/evaluation/rankeval/4b284b1b9oscar_0.json b/4b284b1b9oscar/evaluation/rankeval/4b284b1b9oscar_0.json new file mode 100644 index 0000000000000000000000000000000000000000..b8904e2edbd2421591350a4a90638f138f8b9742 --- /dev/null +++ b/4b284b1b9oscar/evaluation/rankeval/4b284b1b9oscar_0.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.346, + "acc_stderr": 0.015050266127564443 + }, + "anli_r2": { + "acc": 0.354, + "acc_stderr": 0.015129868238451773 + }, + "anli_r3": { + "acc": 0.3516666666666667, + "acc_stderr": 0.013789711695404794 + }, + "cb": { + "acc": 0.39285714285714285, + "acc_stderr": 0.0658538889806635, + "f1": 0.30404040404040406 + }, + "copa": { + "acc": 0.65, + "acc_stderr": 0.0479372485441102 + }, + "hellaswag": { + "acc": 0.3588926508663613, + "acc_stderr": 0.00478695314665708, + "acc_norm": 0.4307906791475802, + "acc_norm_stderr": 0.0049417488176823005 + }, + "rte": { + "acc": 0.49097472924187724, + "acc_stderr": 0.030091559826331334 + }, + "winogrande": { + "acc": 0.5185477505919495, + "acc_stderr": 0.014042813708888378 + }, + "storycloze_2016": { + "acc": 0.6285408872260823, + "acc_stderr": 0.011173814890350133 + }, + "boolq": { + "acc": 0.4954128440366973, + "acc_stderr": 0.008744686941762907 + }, + "arc_easy": { + "acc": 0.4663299663299663, + "acc_stderr": 0.010236494647406476, + "acc_norm": 0.42845117845117847, + "acc_norm_stderr": 0.010154195733990968 + }, + "arc_challenge": { + "acc": 0.22696245733788395, + "acc_stderr": 0.012240491536132873, + "acc_norm": 0.27474402730375425, + "acc_norm_stderr": 0.013044617212771227 + }, + "sciq": { + "acc": 0.679, + "acc_stderr": 0.014770821817934649, + "acc_norm": 0.617, + "acc_norm_stderr": 0.015380102325652715 + }, + "piqa": { + "acc": 0.6877040261153428, + "acc_stderr": 0.010812581599154424, + "acc_norm": 0.6849836779107725, + "acc_norm_stderr": 0.010838072746240652 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b1b9oscar/evaluation/rankeval/4b284b1b9oscar_0_lm-eval_global_step80108_2023-05-04-10-24-43_0shots_backup.json b/4b284b1b9oscar/evaluation/rankeval/4b284b1b9oscar_0_lm-eval_global_step80108_2023-05-04-10-24-43_0shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..b8904e2edbd2421591350a4a90638f138f8b9742 --- /dev/null +++ b/4b284b1b9oscar/evaluation/rankeval/4b284b1b9oscar_0_lm-eval_global_step80108_2023-05-04-10-24-43_0shots_backup.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.346, + "acc_stderr": 0.015050266127564443 + }, + "anli_r2": { + "acc": 0.354, + "acc_stderr": 0.015129868238451773 + }, + "anli_r3": { + "acc": 0.3516666666666667, + "acc_stderr": 0.013789711695404794 + }, + "cb": { + "acc": 0.39285714285714285, + "acc_stderr": 0.0658538889806635, + "f1": 0.30404040404040406 + }, + "copa": { + "acc": 0.65, + "acc_stderr": 0.0479372485441102 + }, + "hellaswag": { + "acc": 0.3588926508663613, + "acc_stderr": 0.00478695314665708, + "acc_norm": 0.4307906791475802, + "acc_norm_stderr": 0.0049417488176823005 + }, + "rte": { + "acc": 0.49097472924187724, + "acc_stderr": 0.030091559826331334 + }, + "winogrande": { + "acc": 0.5185477505919495, + "acc_stderr": 0.014042813708888378 + }, + "storycloze_2016": { + "acc": 0.6285408872260823, + "acc_stderr": 0.011173814890350133 + }, + "boolq": { + "acc": 0.4954128440366973, + "acc_stderr": 0.008744686941762907 + }, + "arc_easy": { + "acc": 0.4663299663299663, + "acc_stderr": 0.010236494647406476, + "acc_norm": 0.42845117845117847, + "acc_norm_stderr": 0.010154195733990968 + }, + "arc_challenge": { + "acc": 0.22696245733788395, + "acc_stderr": 0.012240491536132873, + "acc_norm": 0.27474402730375425, + "acc_norm_stderr": 0.013044617212771227 + }, + "sciq": { + "acc": 0.679, + "acc_stderr": 0.014770821817934649, + "acc_norm": 0.617, + "acc_norm_stderr": 0.015380102325652715 + }, + "piqa": { + "acc": 0.6877040261153428, + "acc_stderr": 0.010812581599154424, + "acc_norm": 0.6849836779107725, + "acc_norm_stderr": 0.010838072746240652 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b1b9oscar/evaluation/rankeval/4b284b1b9oscar_1.json b/4b284b1b9oscar/evaluation/rankeval/4b284b1b9oscar_1.json new file mode 100644 index 0000000000000000000000000000000000000000..35f3508904f63dcf8431751c966b6be26ac45e7e --- /dev/null +++ b/4b284b1b9oscar/evaluation/rankeval/4b284b1b9oscar_1.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.347, + "acc_stderr": 0.015060472031706622 + }, + "anli_r2": { + "acc": 0.331, + "acc_stderr": 0.014888272588203934 + }, + "anli_r3": { + "acc": 0.33916666666666667, + "acc_stderr": 0.013672343491681819 + }, + "cb": { + "acc": 0.4107142857142857, + "acc_stderr": 0.06633634150359541, + "f1": 0.27807807807807805 + }, + "copa": { + "acc": 0.63, + "acc_stderr": 0.04852365870939099 + }, + "hellaswag": { + "acc": 0.3569010157339175, + "acc_stderr": 0.004781061390873926, + "acc_norm": 0.42421828321051586, + "acc_norm_stderr": 0.004932137126625413 + }, + "rte": { + "acc": 0.48375451263537905, + "acc_stderr": 0.030080573208738064 + }, + "winogrande": { + "acc": 0.5130228887134964, + "acc_stderr": 0.014047718393997667 + }, + "storycloze_2016": { + "acc": 0.6162479957242116, + "acc_stderr": 0.011245591019345448 + }, + "boolq": { + "acc": 0.41804281345565747, + "acc_stderr": 0.008626774352070744 + }, + "arc_easy": { + "acc": 0.4684343434343434, + "acc_stderr": 0.010239317603199502, + "acc_norm": 0.45496632996632996, + "acc_norm_stderr": 0.010218084454602578 + }, + "arc_challenge": { + "acc": 0.22866894197952217, + "acc_stderr": 0.012272853582540802, + "acc_norm": 0.26706484641638223, + "acc_norm_stderr": 0.012928933196496349 + }, + "sciq": { + "acc": 0.692, + "acc_stderr": 0.01460648312734276, + "acc_norm": 0.671, + "acc_norm_stderr": 0.014865395385928357 + }, + "piqa": { + "acc": 0.676822633297062, + "acc_stderr": 0.01091197412428213, + "acc_norm": 0.6773667029379761, + "acc_norm_stderr": 0.010907166359856616 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b1b9oscar/evaluation/rankeval/4b284b1b9oscar_1_lm-eval_global_step80108_2023-05-04-10-21-10_1shots_backup.json b/4b284b1b9oscar/evaluation/rankeval/4b284b1b9oscar_1_lm-eval_global_step80108_2023-05-04-10-21-10_1shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..35f3508904f63dcf8431751c966b6be26ac45e7e --- /dev/null +++ b/4b284b1b9oscar/evaluation/rankeval/4b284b1b9oscar_1_lm-eval_global_step80108_2023-05-04-10-21-10_1shots_backup.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.347, + "acc_stderr": 0.015060472031706622 + }, + "anli_r2": { + "acc": 0.331, + "acc_stderr": 0.014888272588203934 + }, + "anli_r3": { + "acc": 0.33916666666666667, + "acc_stderr": 0.013672343491681819 + }, + "cb": { + "acc": 0.4107142857142857, + "acc_stderr": 0.06633634150359541, + "f1": 0.27807807807807805 + }, + "copa": { + "acc": 0.63, + "acc_stderr": 0.04852365870939099 + }, + "hellaswag": { + "acc": 0.3569010157339175, + "acc_stderr": 0.004781061390873926, + "acc_norm": 0.42421828321051586, + "acc_norm_stderr": 0.004932137126625413 + }, + "rte": { + "acc": 0.48375451263537905, + "acc_stderr": 0.030080573208738064 + }, + "winogrande": { + "acc": 0.5130228887134964, + "acc_stderr": 0.014047718393997667 + }, + "storycloze_2016": { + "acc": 0.6162479957242116, + "acc_stderr": 0.011245591019345448 + }, + "boolq": { + "acc": 0.41804281345565747, + "acc_stderr": 0.008626774352070744 + }, + "arc_easy": { + "acc": 0.4684343434343434, + "acc_stderr": 0.010239317603199502, + "acc_norm": 0.45496632996632996, + "acc_norm_stderr": 0.010218084454602578 + }, + "arc_challenge": { + "acc": 0.22866894197952217, + "acc_stderr": 0.012272853582540802, + "acc_norm": 0.26706484641638223, + "acc_norm_stderr": 0.012928933196496349 + }, + "sciq": { + "acc": 0.692, + "acc_stderr": 0.01460648312734276, + "acc_norm": 0.671, + "acc_norm_stderr": 0.014865395385928357 + }, + "piqa": { + "acc": 0.676822633297062, + "acc_stderr": 0.01091197412428213, + "acc_norm": 0.6773667029379761, + "acc_norm_stderr": 0.010907166359856616 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b1b9oscar/evaluation/rankeval/4b284b1b9oscar_2.json b/4b284b1b9oscar/evaluation/rankeval/4b284b1b9oscar_2.json new file mode 100644 index 0000000000000000000000000000000000000000..f60ab9758aac0cde88cb9830625ea13d3d94ae31 --- /dev/null +++ b/4b284b1b9oscar/evaluation/rankeval/4b284b1b9oscar_2.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.336, + "acc_stderr": 0.014944140233795021 + }, + "anli_r2": { + "acc": 0.34, + "acc_stderr": 0.014987482264363937 + }, + "anli_r3": { + "acc": 0.32166666666666666, + "acc_stderr": 0.013490095282989523 + }, + "cb": { + "acc": 0.4107142857142857, + "acc_stderr": 0.06633634150359541, + "f1": 0.24291938997821352 + }, + "copa": { + "acc": 0.66, + "acc_stderr": 0.04760952285695237 + }, + "hellaswag": { + "acc": 0.3552081258713404, + "acc_stderr": 0.004775982650355913, + "acc_norm": 0.42561242780322645, + "acc_norm_stderr": 0.004934250390879783 + }, + "rte": { + "acc": 0.4693140794223827, + "acc_stderr": 0.03003973059219781 + }, + "winogrande": { + "acc": 0.5153906866614049, + "acc_stderr": 0.014045826789783668 + }, + "storycloze_2016": { + "acc": 0.6173169428113309, + "acc_stderr": 0.011239653231976822 + }, + "boolq": { + "acc": 0.4091743119266055, + "acc_stderr": 0.00859956344239735 + }, + "arc_easy": { + "acc": 0.4654882154882155, + "acc_stderr": 0.01023531423896939, + "acc_norm": 0.4553872053872054, + "acc_norm_stderr": 0.010218861787618726 + }, + "arc_challenge": { + "acc": 0.24232081911262798, + "acc_stderr": 0.012521593295800116, + "acc_norm": 0.2832764505119454, + "acc_norm_stderr": 0.013167478735134576 + }, + "sciq": { + "acc": 0.702, + "acc_stderr": 0.014470846741134703, + "acc_norm": 0.68, + "acc_norm_stderr": 0.014758652303574872 + }, + "piqa": { + "acc": 0.675734494015234, + "acc_stderr": 0.010921539041347987, + "acc_norm": 0.6773667029379761, + "acc_norm_stderr": 0.010907166359856616 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b1b9oscar/evaluation/rankeval/4b284b1b9oscar_2_lm-eval_global_step80108_2023-05-04-10-24-43_2shots_backup.json b/4b284b1b9oscar/evaluation/rankeval/4b284b1b9oscar_2_lm-eval_global_step80108_2023-05-04-10-24-43_2shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..f60ab9758aac0cde88cb9830625ea13d3d94ae31 --- /dev/null +++ b/4b284b1b9oscar/evaluation/rankeval/4b284b1b9oscar_2_lm-eval_global_step80108_2023-05-04-10-24-43_2shots_backup.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.336, + "acc_stderr": 0.014944140233795021 + }, + "anli_r2": { + "acc": 0.34, + "acc_stderr": 0.014987482264363937 + }, + "anli_r3": { + "acc": 0.32166666666666666, + "acc_stderr": 0.013490095282989523 + }, + "cb": { + "acc": 0.4107142857142857, + "acc_stderr": 0.06633634150359541, + "f1": 0.24291938997821352 + }, + "copa": { + "acc": 0.66, + "acc_stderr": 0.04760952285695237 + }, + "hellaswag": { + "acc": 0.3552081258713404, + "acc_stderr": 0.004775982650355913, + "acc_norm": 0.42561242780322645, + "acc_norm_stderr": 0.004934250390879783 + }, + "rte": { + "acc": 0.4693140794223827, + "acc_stderr": 0.03003973059219781 + }, + "winogrande": { + "acc": 0.5153906866614049, + "acc_stderr": 0.014045826789783668 + }, + "storycloze_2016": { + "acc": 0.6173169428113309, + "acc_stderr": 0.011239653231976822 + }, + "boolq": { + "acc": 0.4091743119266055, + "acc_stderr": 0.00859956344239735 + }, + "arc_easy": { + "acc": 0.4654882154882155, + "acc_stderr": 0.01023531423896939, + "acc_norm": 0.4553872053872054, + "acc_norm_stderr": 0.010218861787618726 + }, + "arc_challenge": { + "acc": 0.24232081911262798, + "acc_stderr": 0.012521593295800116, + "acc_norm": 0.2832764505119454, + "acc_norm_stderr": 0.013167478735134576 + }, + "sciq": { + "acc": 0.702, + "acc_stderr": 0.014470846741134703, + "acc_norm": 0.68, + "acc_norm_stderr": 0.014758652303574872 + }, + "piqa": { + "acc": 0.675734494015234, + "acc_stderr": 0.010921539041347987, + "acc_norm": 0.6773667029379761, + "acc_norm_stderr": 0.010907166359856616 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b1b9oscar/evaluation/rankeval/4b284b1b9oscar_3.json b/4b284b1b9oscar/evaluation/rankeval/4b284b1b9oscar_3.json new file mode 100644 index 0000000000000000000000000000000000000000..937256dd7b36e8a793161c20149a772d72be6e28 --- /dev/null +++ b/4b284b1b9oscar/evaluation/rankeval/4b284b1b9oscar_3.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.355, + "acc_stderr": 0.015139491543780532 + }, + "anli_r2": { + "acc": 0.365, + "acc_stderr": 0.01523177622626491 + }, + "anli_r3": { + "acc": 0.3375, + "acc_stderr": 0.013655897185463652 + }, + "cb": { + "acc": 0.4107142857142857, + "acc_stderr": 0.06633634150359541, + "f1": 0.2889767237593324 + }, + "copa": { + "acc": 0.62, + "acc_stderr": 0.04878317312145632 + }, + "hellaswag": { + "acc": 0.358195578570006, + "acc_stderr": 0.004784901248558721, + "acc_norm": 0.424317864967138, + "acc_norm_stderr": 0.004932289405608946 + }, + "rte": { + "acc": 0.4729241877256318, + "acc_stderr": 0.030052303463143706 + }, + "winogrande": { + "acc": 0.5043409629044988, + "acc_stderr": 0.014051956064076892 + }, + "storycloze_2016": { + "acc": 0.6194548369855692, + "acc_stderr": 0.011227604968407471 + }, + "boolq": { + "acc": 0.41651376146788993, + "acc_stderr": 0.00862228802067401 + }, + "arc_easy": { + "acc": 0.47053872053872053, + "acc_stderr": 0.01024195772840968, + "acc_norm": 0.4642255892255892, + "acc_norm_stderr": 0.010233488709726547 + }, + "arc_challenge": { + "acc": 0.23378839590443687, + "acc_stderr": 0.012368225378507142, + "acc_norm": 0.2713310580204778, + "acc_norm_stderr": 0.012993807727545794 + }, + "sciq": { + "acc": 0.715, + "acc_stderr": 0.014282120955200484, + "acc_norm": 0.687, + "acc_norm_stderr": 0.014671272822977886 + }, + "piqa": { + "acc": 0.6621327529923831, + "acc_stderr": 0.011035474307853841, + "acc_norm": 0.676822633297062, + "acc_norm_stderr": 0.010911974124282128 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b1b9oscar/evaluation/rankeval/4b284b1b9oscar_3_lm-eval_global_step80108_2023-05-04-10-24-43_3shots_backup.json b/4b284b1b9oscar/evaluation/rankeval/4b284b1b9oscar_3_lm-eval_global_step80108_2023-05-04-10-24-43_3shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..937256dd7b36e8a793161c20149a772d72be6e28 --- /dev/null +++ b/4b284b1b9oscar/evaluation/rankeval/4b284b1b9oscar_3_lm-eval_global_step80108_2023-05-04-10-24-43_3shots_backup.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.355, + "acc_stderr": 0.015139491543780532 + }, + "anli_r2": { + "acc": 0.365, + "acc_stderr": 0.01523177622626491 + }, + "anli_r3": { + "acc": 0.3375, + "acc_stderr": 0.013655897185463652 + }, + "cb": { + "acc": 0.4107142857142857, + "acc_stderr": 0.06633634150359541, + "f1": 0.2889767237593324 + }, + "copa": { + "acc": 0.62, + "acc_stderr": 0.04878317312145632 + }, + "hellaswag": { + "acc": 0.358195578570006, + "acc_stderr": 0.004784901248558721, + "acc_norm": 0.424317864967138, + "acc_norm_stderr": 0.004932289405608946 + }, + "rte": { + "acc": 0.4729241877256318, + "acc_stderr": 0.030052303463143706 + }, + "winogrande": { + "acc": 0.5043409629044988, + "acc_stderr": 0.014051956064076892 + }, + "storycloze_2016": { + "acc": 0.6194548369855692, + "acc_stderr": 0.011227604968407471 + }, + "boolq": { + "acc": 0.41651376146788993, + "acc_stderr": 0.00862228802067401 + }, + "arc_easy": { + "acc": 0.47053872053872053, + "acc_stderr": 0.01024195772840968, + "acc_norm": 0.4642255892255892, + "acc_norm_stderr": 0.010233488709726547 + }, + "arc_challenge": { + "acc": 0.23378839590443687, + "acc_stderr": 0.012368225378507142, + "acc_norm": 0.2713310580204778, + "acc_norm_stderr": 0.012993807727545794 + }, + "sciq": { + "acc": 0.715, + "acc_stderr": 0.014282120955200484, + "acc_norm": 0.687, + "acc_norm_stderr": 0.014671272822977886 + }, + "piqa": { + "acc": 0.6621327529923831, + "acc_stderr": 0.011035474307853841, + "acc_norm": 0.676822633297062, + "acc_norm_stderr": 0.010911974124282128 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b1b9oscar/evaluation/rankeval/4b284b1b9oscar_4.json b/4b284b1b9oscar/evaluation/rankeval/4b284b1b9oscar_4.json new file mode 100644 index 0000000000000000000000000000000000000000..0bf0c515f00b6541e439d38d994f4fe6cfff9049 --- /dev/null +++ b/4b284b1b9oscar/evaluation/rankeval/4b284b1b9oscar_4.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.369, + "acc_stderr": 0.015266698139154617 + }, + "anli_r2": { + "acc": 0.348, + "acc_stderr": 0.01507060460376841 + }, + "anli_r3": { + "acc": 0.3425, + "acc_stderr": 0.013704669762934732 + }, + "cb": { + "acc": 0.4642857142857143, + "acc_stderr": 0.0672477765493766, + "f1": 0.32222222222222224 + }, + "copa": { + "acc": 0.68, + "acc_stderr": 0.04688261722621504 + }, + "hellaswag": { + "acc": 0.359788886675961, + "acc_stderr": 0.004789575163418652, + "acc_norm": 0.42401911969727146, + "acc_norm_stderr": 0.004931831953800041 + }, + "rte": { + "acc": 0.48014440433212996, + "acc_stderr": 0.0300727231673172 + }, + "winogrande": { + "acc": 0.5177584846093133, + "acc_stderr": 0.014043619596174959 + }, + "storycloze_2016": { + "acc": 0.6173169428113309, + "acc_stderr": 0.011239653231976824 + }, + "boolq": { + "acc": 0.41804281345565747, + "acc_stderr": 0.008626774352070744 + }, + "arc_easy": { + "acc": 0.45791245791245794, + "acc_stderr": 0.010223371342195897, + "acc_norm": 0.4612794612794613, + "acc_norm_stderr": 0.010228972678389606 + }, + "arc_challenge": { + "acc": 0.23464163822525597, + "acc_stderr": 0.012383873560768682, + "acc_norm": 0.2883959044368601, + "acc_norm_stderr": 0.01323839442242818 + }, + "sciq": { + "acc": 0.729, + "acc_stderr": 0.014062601350986186, + "acc_norm": 0.707, + "acc_norm_stderr": 0.014399942998441268 + }, + "piqa": { + "acc": 0.6730141458106638, + "acc_stderr": 0.010945157126978217, + "acc_norm": 0.6702937976060935, + "acc_norm_stderr": 0.010968357083095152 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b1b9oscar/evaluation/rankeval/4b284b1b9oscar_4_lm-eval_global_step80108_2023-05-04-10-24-43_4shots_backup.json b/4b284b1b9oscar/evaluation/rankeval/4b284b1b9oscar_4_lm-eval_global_step80108_2023-05-04-10-24-43_4shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..0bf0c515f00b6541e439d38d994f4fe6cfff9049 --- /dev/null +++ b/4b284b1b9oscar/evaluation/rankeval/4b284b1b9oscar_4_lm-eval_global_step80108_2023-05-04-10-24-43_4shots_backup.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.369, + "acc_stderr": 0.015266698139154617 + }, + "anli_r2": { + "acc": 0.348, + "acc_stderr": 0.01507060460376841 + }, + "anli_r3": { + "acc": 0.3425, + "acc_stderr": 0.013704669762934732 + }, + "cb": { + "acc": 0.4642857142857143, + "acc_stderr": 0.0672477765493766, + "f1": 0.32222222222222224 + }, + "copa": { + "acc": 0.68, + "acc_stderr": 0.04688261722621504 + }, + "hellaswag": { + "acc": 0.359788886675961, + "acc_stderr": 0.004789575163418652, + "acc_norm": 0.42401911969727146, + "acc_norm_stderr": 0.004931831953800041 + }, + "rte": { + "acc": 0.48014440433212996, + "acc_stderr": 0.0300727231673172 + }, + "winogrande": { + "acc": 0.5177584846093133, + "acc_stderr": 0.014043619596174959 + }, + "storycloze_2016": { + "acc": 0.6173169428113309, + "acc_stderr": 0.011239653231976824 + }, + "boolq": { + "acc": 0.41804281345565747, + "acc_stderr": 0.008626774352070744 + }, + "arc_easy": { + "acc": 0.45791245791245794, + "acc_stderr": 0.010223371342195897, + "acc_norm": 0.4612794612794613, + "acc_norm_stderr": 0.010228972678389606 + }, + "arc_challenge": { + "acc": 0.23464163822525597, + "acc_stderr": 0.012383873560768682, + "acc_norm": 0.2883959044368601, + "acc_norm_stderr": 0.01323839442242818 + }, + "sciq": { + "acc": 0.729, + "acc_stderr": 0.014062601350986186, + "acc_norm": 0.707, + "acc_norm_stderr": 0.014399942998441268 + }, + "piqa": { + "acc": 0.6730141458106638, + "acc_stderr": 0.010945157126978217, + "acc_norm": 0.6702937976060935, + "acc_norm_stderr": 0.010968357083095152 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b1b9oscar/evaluation/rankeval/4b284b1b9oscar_5.json b/4b284b1b9oscar/evaluation/rankeval/4b284b1b9oscar_5.json new file mode 100644 index 0000000000000000000000000000000000000000..7ab092e9d4cf96d9781ed5439ec5f1877aea8741 --- /dev/null +++ b/4b284b1b9oscar/evaluation/rankeval/4b284b1b9oscar_5.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.363, + "acc_stderr": 0.015213890444671283 + }, + "anli_r2": { + "acc": 0.35, + "acc_stderr": 0.015090650341444233 + }, + "anli_r3": { + "acc": 0.3333333333333333, + "acc_stderr": 0.013613950010225617 + }, + "cb": { + "acc": 0.32142857142857145, + "acc_stderr": 0.06297362289056341, + "f1": 0.2379385964912281 + }, + "copa": { + "acc": 0.65, + "acc_stderr": 0.0479372485441102 + }, + "hellaswag": { + "acc": 0.3551085441147182, + "acc_stderr": 0.004775681871529861, + "acc_norm": 0.42869946225851424, + "acc_norm_stderr": 0.004938787067611805 + }, + "rte": { + "acc": 0.4729241877256318, + "acc_stderr": 0.030052303463143706 + }, + "winogrande": { + "acc": 0.516179952644041, + "acc_stderr": 0.014045126130978603 + }, + "storycloze_2016": { + "acc": 0.615713522180652, + "acc_stderr": 0.011248538366952603 + }, + "boolq": { + "acc": 0.40948012232415903, + "acc_stderr": 0.00860054975132092 + }, + "arc_easy": { + "acc": 0.468013468013468, + "acc_stderr": 0.010238767643185723, + "acc_norm": 0.4511784511784512, + "acc_norm_stderr": 0.010210757101073475 + }, + "arc_challenge": { + "acc": 0.23293515358361774, + "acc_stderr": 0.012352507042617391, + "acc_norm": 0.2773037542662116, + "acc_norm_stderr": 0.013082095839059374 + }, + "sciq": { + "acc": 0.731, + "acc_stderr": 0.014029819522568196, + "acc_norm": 0.71, + "acc_norm_stderr": 0.014356395999905694 + }, + "piqa": { + "acc": 0.6659412404787813, + "acc_stderr": 0.011004613886336733, + "acc_norm": 0.6751904243743199, + "acc_norm_stderr": 0.010926296238294038 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b1b9oscar/evaluation/rankeval/4b284b1b9oscar_5_lm-eval_global_step80108_2023-05-04-10-24-43_5shots_backup.json b/4b284b1b9oscar/evaluation/rankeval/4b284b1b9oscar_5_lm-eval_global_step80108_2023-05-04-10-24-43_5shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..7ab092e9d4cf96d9781ed5439ec5f1877aea8741 --- /dev/null +++ b/4b284b1b9oscar/evaluation/rankeval/4b284b1b9oscar_5_lm-eval_global_step80108_2023-05-04-10-24-43_5shots_backup.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.363, + "acc_stderr": 0.015213890444671283 + }, + "anli_r2": { + "acc": 0.35, + "acc_stderr": 0.015090650341444233 + }, + "anli_r3": { + "acc": 0.3333333333333333, + "acc_stderr": 0.013613950010225617 + }, + "cb": { + "acc": 0.32142857142857145, + "acc_stderr": 0.06297362289056341, + "f1": 0.2379385964912281 + }, + "copa": { + "acc": 0.65, + "acc_stderr": 0.0479372485441102 + }, + "hellaswag": { + "acc": 0.3551085441147182, + "acc_stderr": 0.004775681871529861, + "acc_norm": 0.42869946225851424, + "acc_norm_stderr": 0.004938787067611805 + }, + "rte": { + "acc": 0.4729241877256318, + "acc_stderr": 0.030052303463143706 + }, + "winogrande": { + "acc": 0.516179952644041, + "acc_stderr": 0.014045126130978603 + }, + "storycloze_2016": { + "acc": 0.615713522180652, + "acc_stderr": 0.011248538366952603 + }, + "boolq": { + "acc": 0.40948012232415903, + "acc_stderr": 0.00860054975132092 + }, + "arc_easy": { + "acc": 0.468013468013468, + "acc_stderr": 0.010238767643185723, + "acc_norm": 0.4511784511784512, + "acc_norm_stderr": 0.010210757101073475 + }, + "arc_challenge": { + "acc": 0.23293515358361774, + "acc_stderr": 0.012352507042617391, + "acc_norm": 0.2773037542662116, + "acc_norm_stderr": 0.013082095839059374 + }, + "sciq": { + "acc": 0.731, + "acc_stderr": 0.014029819522568196, + "acc_norm": 0.71, + "acc_norm_stderr": 0.014356395999905694 + }, + "piqa": { + "acc": 0.6659412404787813, + "acc_stderr": 0.011004613886336733, + "acc_norm": 0.6751904243743199, + "acc_norm_stderr": 0.010926296238294038 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6ab4793108f82b12a8bec8ad8b2ec20a834564c4 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b25e4140e42d21ee67a812ebf07471d1da1094180c1ecef97fd3ad8abf55cf3 +size 199058647 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bdbcf496c3f67807a8f1359f1abff5e539323b82 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa77c7f9e4056df72a77f68b5cce7bfcd8738df2e8823b1617476ffcdb5685f3 +size 199058647 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..660d7f0af0402cb2c16d8b442fe83bac162ec214 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0988b23d8b86a7d952d250c8652f64e9ed33380e69f6061e693f426cb53b8f26 +size 199058733 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a6a740228ea6d1d35d05832be70865813c2d583b --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7db07b25bca2aaffe645c877fc0eb04cd67614d9d7347231a911e93c9702555c +size 199058733 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e18580b64c78996e1eec9850834b23fa7c01b323 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:85a7ed69ce49ec2e7db8d70406b29b129fd09da28c290901b2c50cde91cd171d +size 199058797 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b9aaa483267103c47955149c9e0dcd4b0b437809 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b05e90173bd8542e3b3d9aaf6f216bd0c978b51801e195e296466f421fa121d7 +size 199058797 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..40480a7e79393c70a56334f8d3a33c253c8e6e06 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d018a05a4ae09a11145397136454e9435f773c38c265c01a8f4196e54c913df +size 199058733 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b99aac80eb119e0a7b0cce68e96c4a57ffb1362d --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7728d42678afcbf05f091dbb55f92f471abe78e7a9f41e95b825b075992b8499 +size 199058733 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8b0ba2e06e7a9d298fc0c05282329032fd70662d --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3dcf3f5c733a06e4f1bca2c91ff0cf3ba650929cfa1903aa0d4dd94d87439021 +size 199058733 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..64285412d35cf00f0673ab9d5a2753af1f477fe3 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a74e76e82f26aa92e45b61deb46fea432630d6e8d0d991240a4fcd614b21153 +size 199058733 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c1605edd1259dd4f4a5b7ceeda7b1c091074328c --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46021cc0b9e31805724a64a0c981df3cc2da5314f1b7c16328d386542c8afa1b +size 199058797 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d225b04a1ac052e59dce1f55ecc1d8f99d3db6d0 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3151f3ebe8e0a7e433d6cb67fbc7e5ecb730ef3ad8115425eab7e84c59b4a910 +size 199058797 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ba1c8473822c1dddbab6b4759b7d87221b053825 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a82125879b5d66398a0c5b6d3451e70a9bd36f567368813102c33f639ed4b792 +size 199058733 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9c6a15b02ce83d5af0009909cf66ac87d38e3b0f --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b75ed6992533b62d0a67dcd2cd0bb2d9f1c692249c1dd1a626852057ff30e5ff +size 199058733 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ac78d2793102e0135177ede340409677fc2b78f4 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:490e3a13a0e1184b77b8d2a599ad592af9abe338c57c614bfef9d950439c4c50 +size 199058669 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1a40ff306b6762849eac89eaa2800911cc6ed963 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20207f6943a0d819aa817c8e659e5bdb7d5461b45c53b95cc73d7a0b34219d65 +size 199058669 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b4c674b2ba69dfef9eacad76ce789e42e52785d3 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08cea737100c9baea63ba513e38f0bb20eaa859541da01507c0aff25e6c1a2e2 +size 199058797 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..044aed2f9ef59d2afa246bcd7bcf1185e3900c8c --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c7d38c850046162df72016bbce1a68469a3d75d9b4e24966b05cab76f763ce7 +size 199058797 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e74b78c769b257fe5ce3c026185dc308a34a9007 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba8a05a33b26ea4764b8082831c5e005ee60bc9091dd5e4303a864c8402985af +size 199058733 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a47131381a9941950074ad2975eff34f6b697d52 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd803eac42a1dd2ac9772fe73d9307d679bbca68015554a19759abf819468250 +size 199058733 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..208119929857a8892bbd3ea30b302e6978c1e9a1 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:368fe3f5203f39ab43c006078bf759209213aa197d4abd82f07e0ac98510436a +size 199058733 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1ebfa154d00fb3dcc629d22c78d7a7be1582f5d6 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a0a6566c44cb9203db660a6bb1240bb7f89b1296b8302b74106c239cedafaeb9 +size 199058733 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8620c740e802aa7cbd2d13a638ad6c391d0cda12 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bce75d2f753fd60abd03e9f3030bef17ebec99121f716f135ef0f3adb3e0c741 +size 199058658 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..83286876beef27065b0c8e238864a492fcf5927d --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:87156756c437608466e3f0636b6c1c8da763a152bf135275381a166d7d7b48b5 +size 199058658 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..caaeef3d7a14b4e524c86602c8ce83da17742b68 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6db03ba08d2630a7e1bd379575c909bf26005df61fa69de11aea770e52f66200 +size 199058733 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c2e28dc9f02b11286f0d0e3429b2d6f4e4e03212 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed548c89937924d9de20295737a4bd0a832cdff88d06dcfd825f327e096df1ce +size 199058733 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bd3546eba304eb230fa1af2f09232e9fccf471c2 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:efa58d1feafd61f60bb4b30755de03f284ffcd97c09c4ffe897ae04223393e19 +size 199058797 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1e84880f85cc7e5be4d207d3a31612fa1f8419a0 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe5e3ee5df0f9408aac36dd5a4e9571c274dc13d81292bbd4c358b45ed410823 +size 199058797 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5b007ecb3d07f6513790cce8d8ab1835c85f7207 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e40fdac046e58e5f196b97c7614dfd97d134f162782d8ac444cbef43106cc6bc +size 199058605 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..aebeb3c0713ffa4fbfbe8caa68305148659ad374 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c95c44eeac533739610b8dd4875a2747bd4e500588750f2a5bbe6231b4a70e8f +size 199058605 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..296f973dac5903d4a03be1f3f8ae8bf42795ae70 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f2c699a65cc94fdfcb3249a60bcf07650e941e0c507ff4bed30418ab732cf27a +size 199058669 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5dff2e3aebea462035fd5f6d32a307bab15c6a87 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:28af67a1211cf229276bda4a622b700ee30ec321916c1e7ba8b4bf419d86ecba +size 199058669 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7682077827650473fd84189487f5dcde75c16040 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:115438233d6b2035e9b7ba351387cc013fbffb8eb49af8c8055c16ba2d9eee4d +size 199058797 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..539693d120f83cd7f6cbbf438e54670270642896 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46042bc325d1c061c6207488a44fca922488f06e2cdc8d559fad571078486d76 +size 199058797 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c09d2e7d1ed12208f16c15dd6e27728d9400cc5d --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:50652cfed378f9bc8ba6388f1cc51e74d0931aa8b8980761728cab897d6de1f2 +size 199058733 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4ae29082b0af70096f5c6b2e7e10e046713709bc --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5de487f5043509fdae156e6d55b7cf89b18b5224a6125fb7bb8df5778c37006c +size 199058733 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..29a72ffc766fe56abffa2ee6af0a1ea64b250ddc --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d9457f6f9635ac2d5cf1f7d44358e24728e0363e1b7c1b0552be63079b5600a +size 199058733 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..56e1d2ad249d37fc0739e33f512d9a7e392a7bd4 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c05d87aedb5c7bad0477a091bb29e55e4ed52d71eaadff70063707f7985e9d6e +size 199058733 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a1067b3f3ea14d7237c9893e60b77b316636b64b --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:41265118b1d07c528b857d3b9ad4a83a7ae384052b28b575d5aa7fcd15d0c74d +size 199058733 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..803757474dd041b848ef48273829dafa29692d28 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b90c33a854009cce069c17e44d96b70117e40b5997ba0303c8be063ac148291 +size 199058733 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..72fdcabed0edbeb8e58a7491c9e89c21604c211e --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a3d8ff38a59ee93185b98c1ce3bc43d46f6de8753bb64403181c6e64701483a +size 199058797 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6d9ec013cfae69d5ea056e92e895a8a17cd176b0 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1fa5d01fe30b48e7d2696f7341c73de0f41cf668dbbae8ddd4b575772580bc0d +size 199058797 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ccc947d5f182b31cec02919d00ae70565821142f --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b82946381fd0c62c4e3a486f3bf2f28c32fe398fc7dee8928fe89a273437dbea +size 199058669 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6513dd5b5bcfa5a07f00cb3047f0a5d19e3af99e --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f351eb44a18f2262928d7ff3c53918fd2441493feddc8e5b8ce74af344edda8 +size 199058669 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c2a408acc1e1e1606011c327e54d1523279282cf --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:21be72d141c36c22309f83f598bf2432260f96e527d441b5cee77a29146b57cc +size 199058850 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9083a103d575587aee7e89d98deead92a8a0de91 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cebe856d6828ee5622d6ff95a8f8bf288a70ad96cb5acde8eb92810ccd2c5ed6 +size 199058850 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d2b3124881c469b1bc0eb3c88ec6ae87da58863d --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:49188cac7b7f462d417324572fad9cd2cbca14ce45624900250275ffdbf5ddfe +size 199058669 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1a83a3d53e727e8d81369193eaa296fc41faf71a --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d45505fed06bc60c57c55b0c95f518a95f6aac4af8ebf729154368e1ba732792 +size 199058669 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a91db5c2f2b83a5a119ec395083746e1245f83dc --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0128fb4745aa86e91d7980b60f4cf2a38768ee39db5545a36f3af14bf764f3ce +size 199058797 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3b0c2ee3dd8cf2f1c87484518ce813afaa7d525a --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d12be32b6874316d99e1277186fcbd9a691a3c6950f0150f62085a92a7edb18 +size 199058797 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..de9c88df87ee3c343edc83c55291c7e85f136070 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:47268e9b8c55bd03e2ce3747dabf57e574ae2e28a5caa9744de07bcef1a53bcd +size 199058733 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..989f407e6f4e78c9cf29c7d1b1f8ddaf34e81155 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:688b4de6936ed1de5b9d4f026ef094fc6957d2d97c3fc4cdfcaa2a71367ab951 +size 199058733 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dfad40e3336b5c976357c954c9807d15de49a1eb --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:96ab37f8328a2cb56e67b54d19c0dc0d2952938458262c130eb700a1ac43e824 +size 199058733 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..85d10e3ce487bcad1867205cb0c31cfa732a41f5 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e3b3bc4e99546522834b89cd4fa95c4a3fd1b1c339fd2deca4b3f81b3779040 +size 199058733 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6836d39e0fff69e66394db756147fe88179c4946 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ba11825c27f446c828ae39139597a54fb6ab9a47dc5d1eaca84ac4ed753385a +size 199058669 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0ad51ee10dd348f440f2f19f3476a2a047079cbf --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c36f8507a2593590145822daa626e6b922f76e633f7fd18204130424e97f7ef5 +size 199058669 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e0a94202b952e6141f98af52b288cbd17edccc2f --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d7dd42a3950c520a163e559ccebe75bab134a64e4cbb994f9f93263c76baffe4 +size 199058925 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..274a23466866063cd40f558db7450dd54ce8073e --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:78dc710768e1ca37329db6bb02e335039111803438311599674622970b83d736 +size 199058925 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b3e9bc0dd42b0577ff635cdf4d9d0b6c29f0f3e1 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa5d56e1adb509510906845443cd3b20644c2282d16714eb7d0c154c2b6a59f6 +size 199058605 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a1f9823dc6be8ff3219affdeba1cd6f247b32394 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed9361a6ec89f19f4c8536b04b22e310be22209879b0aa7b1ac8daf5b45a748d +size 199058605 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4c6cc26547bf6816eefe9d524cad028d70d93aac --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b3ea2c747ad0cc02d7153941a70658fbb11381e71310ae380f544e22bb2960eb +size 199058605 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..093d28593f174936b8131e3bd6f26201ffdcae7a --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b5c62227180e95bca7e9b1c5770ef052a700b9ab2b4006915c9b1c5132734ac +size 199058605 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f490495eef37465d7b34ab6309d7777f3f1e83d2 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:12627d905b6e0252d4b76cb24c7743ae1efe12b8996ae2e0bb48493a22d0c259 +size 199058722 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6139f2c1d1c14b6d4cd134ece29d8f9a6aac80d2 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c54da59c782a4880d5b9e90bd85e8265226dacd8bac04be55dd0603f194aea53 +size 199058722 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..97b1eb23c128bf9eaa64dce481727b6f802b6f34 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6a53067297e91fb2cbd1563b19ddf5b898ba8b7b2059307868bad811a9030905 +size 199058658 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6cd10459e94bcc1395c88e2a13b3666994c7494d --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6be24c7c90667fe6e5eec5952cc6ac4fbae5ca4c10ae10a619378040dc133146 +size 199058658 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3f18a14f4ab9cc081b5f4da5b99f04cd5edbf7eb --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d7001f8c7e52df2950275116d8db2227018a5c96d3bb2b855581609aed4fdc98 +size 199058722 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b674baa99ca5f5216162941b8e26931632c8549a --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ddd3f09208e03171cff555c9173c00dbd394b4e4cee1f869de98ae7a7fac6283 +size 199058722 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b858be267781f3168d9f8a87313e5c3042dee317 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:513d9407f04643fc9ae401d5375f72ea43ad70a7d6a3747a334f638961805f9d +size 199058658 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4f041cca9e09ebd8f21046a7c18e553eec11d6b8 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0917d5568e732ad4f6ee8b68184ecdfc78cfc6d15f1f76646f86a6778764ccb5 +size 199058658 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8f9ad3f7fa9c6e341d5afa0b6731ad2ad7eacc99 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6dba46487e4d68ee5633f7c6294377c25eab1e4c7cc3d980484c217063672b36 +size 199058786 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..398b01ac3ea9eb883109450c6c1901f7df046ab3 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8b5130f5a1c7ef9d1589af343937214a3e918aee33625280c3f3913d24f93de +size 199058786 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..54caa5c2ea68543bf99a5f3d14874c1e6b8737da --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0df1c91d2a0984c022b3b26a655a957d4809a267282dd9ad771e66eb2be62ea2 +size 199058658 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e83b35a94baf2f412fc9d712ea68175deb34716d --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce20fab4a4e4ee2a9c37dbbd6bc63a80f5180aba655e4ba1e75728ba690847ad +size 199058658 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8ea72627e5d47d060b2930956daee03f44bd86c6 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd0f5fcdd4b10c85c7f43eca50cd9f187572ceb78774e9d652bd256c60a09efe +size 199058978 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e2b0ee80510eb329a0b044d899ab8815e8a5cddb --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bfa811c9a0909afa7fde00466144c286c6e0494633cdd2d53f7f555b0c0fbfa5 +size 199058978 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ada6a36f858129bcdbea289823e881cf163f28bd --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9fce72696168a6bd3aab2600aa9bd28f137bff98ff921f996d78eff6b68cf06 +size 199058658 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..530eca88b097b4f722f73cd7e005f3b3d1241b73 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:63c5c4d5331bfd225a2c4e731e654c7b423053d7c7ada3ad746043c0e8756568 +size 199058658 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6db30f3c603a2718ab906c1f7bd201d276a968d7 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bdb45763e691dee8efb7fe71b7461eb51960048db13ddb8d51d035f4262b3370 +size 199058647 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6d9208f131c69329b3efc2d24bf2cfc32afd2711 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7bcc00f1ff9b7d0d753fe694e9d95deb9d9629ea89db2688aac3d95b9b3a1947 +size 199058647 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f90b22d6d283e77450f85b27a49fecb8a73cfccd --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:37ac79e1e06b8bcb358f471a539deddf8b95b09103b2178007b7b8e701f88f3d +size 199058658 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cc03f3b3add4bae1cc6ecd4186534886ee7b9f25 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a2710d1282efc80aa1726481d8078b263d9e5c8054c668be4842d485efe535b7 +size 199058658 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..462c7372b369560ce7248ced2af944f4edb54d2e --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e1d94f490379c2869326e4598fbf4e618b3ba6b58a11e5d81efd48cc16324165 +size 199058722 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..909da8a890bd6665dc9dd28dd95f38490fb9cc82 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:263e1e2215e14164d3d2291206081d88f08bd9ab9b250767d2da962ddb0bf2e7 +size 199058722 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3339da988661577475070ecf4fa6b27f30fa25f8 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c7fe1b1d0aa347f9b473ac95eade7d8dff1c7ec634f128ab847aca0f614b7e6 +size 199058658 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d6b03e7706e5679a7ac2e0becaa130ae2d7a552c --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:257bf95828558e815b1ef7a86c8a438aecb1d3ccbc53dc4e0daca0dace7e4941 +size 199058658 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..74db8a42e6e5ae8433dadb10803fdd0770ab4010 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:95280070f15ded3d701c5a0e815dfd3a80d2857382d360c6558c48ae71a06168 +size 199058786 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c5e05c14b7aa6ae131a65c300faf52c78aae3413 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c226e71d36c6e7e25643b929e512b27ce497ec4b0800a8df3246a11fca6042da +size 199058786 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..eef529fb5246cceffe4b1d07af962c2e976e0a15 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db9f668904d4470b312cf8069635f56ff3433f832ff07e09aab9225a7144846a +size 199058722 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..714ab5979f6fc6ba64f2d7bddd2507ab3c998927 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:acdc911c0b5ca6216189310994ff7915240a0fe509c8639fc82d2cf8992e6423 +size 199058722 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ce9dc940b2c70df38daddd89039ff6fdf5dfc80d --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee0555539de25f0a37a4569b2fe88218e897858ba982e78d6020aaabdd009401 +size 199058850 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5a677e14026b656c1a3ee995435b3866c62b7500 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc14fbad6169d20d07066cee5e46f3f816b8715bed99c0373a9e4bd113e1c4bd +size 199058850 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..756c690f1bb48e7e984b5ddc669dc0f03193c0e0 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:68729d9584b43ba6840fbbb6889df9a6b464ca3018c34da622ce11ee3e3c8f54 +size 199058722 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c68553faad124d73e17d3ff472c9b50599575f76 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46e881d59124a6c7717515140b6092cc00b0f1c631843045fce284414e83f895 +size 199058722 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..218b7b2fc17897c0d62baef9d5d3039198adac57 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:42c780314d971af45e4ff543635010e8a349bf0cf970425316fafcc54b3de0ea +size 199058722 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d69745b3f6916548b7d907f85cfb973765665124 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac9662cea2efc8d7a089936bbbe1265f978e72e5e0c2148be9fe4e171ba283fc +size 199058722 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a88777142d039a70f2a0f04f14bd1bcd26a72f7a --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bcd6d563cc037e4be686e81d236f3ae6bdfcee8b87a0ee87eaf0a355586c6631 +size 199058594 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d20566ecb852a5586f89641edc9a872a5fb4b862 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4be1f7c04f4392334e6cb346be2a5b137a19c7006e36876cb68fc6ec8a95205e +size 199058594 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ab47bacdb5b48177973677d1cbff948b3885f214 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:11a21c5a75b8c8078b6c0cd74ea43c8b9b45abd1b28e42e37d6497f8a983c545 +size 199058786 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d68c67d6cf853c72b45db7e30261443cb1e2fef7 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b0a1f2408aab00a6c3f7e69fec955ac283f2d8cf8ad8f56049c16ae15714e24d +size 199058786 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f77c6f968fd355f42ea02187c52f1c57f6a6636a --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f9418a242b0d2868fa061ec552004f1bcc2042c8c2c89e87f8b533b044f7ff22 +size 199058711 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ceb5a316bba39ac2666f4e54b64ca4d680007b4b --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd92d354291540f543d59ed7bfb93408ad5047e47a9172b158c1e6f5613d988a +size 199058711 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5f5ab2a47009e3f021b256c19310732058f12c9a --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:16fc0e7d92390176526b34b26b3b8daac8539275c6984c956dd44ca516c975c7 +size 199058722 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..10bd6576c4163075acdf9e41d0f221523d0e0e83 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:80484e2305df386f13a34691f6028b87276b271a2d7edfb57c6463db914d67e2 +size 199058722 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..368e6fc824062eb805093bfa31a04a69cee38d03 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c144246464bff9fbb2a81ca6816858fe292e1ade1cd8ebae48eceaf685d99047 +size 199058722 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..93fe69a6a36fd9f4d72bcde182fd762b0b482dc9 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7a1c8071a119dbed3e3882bc5b6aae68382da33f2575e5ba35a3aed2e3bdcfc +size 199058722 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8a7daaa151d3c390d5db05a471352a30b79d4712 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca941bd3d2ebdb33f2683e94e39a4c16cf7e041fbc86bbf3c3bd7fd03937e872 +size 199058722 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fc792ba8e73feed904016f874dc4701c54d8e991 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:93edf94c7a39034dc249f7cde65465cb9fcd8f1d5cad7a056dacabce2538864c +size 199058722 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a6eef12cf81eaabcc9105616289885fa31a41b5d --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c61c5e137e30e68218a6f5c0fcfc766252719a8fc7f5c3a9fb71260c23a5b74f +size 199058722 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5c98fbae955404bb832836513df350ebfdb5bb0f --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0958679f24702a2ba946dcf09b321190dc818c841d0795e83a83c5d287b73c22 +size 199058722 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3b41a2b4fd376d3cc55b7cead543098dba4504d5 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea8ec895a8d464b0d715f260c5823028e2a1c973741493cf3f4355b1d1a1b6d5 +size 199058722 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5da4d938031c53db778bbb1677296d7f9cad05e2 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cfc46fccb39777a2c31914192b43cfe363fbc2b5f991c1b365cf7f2a97424ec4 +size 199058722 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6f1e4518ca167cc684c2778f8f03fb2267402c17 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a0d63b42af2ce8af221a08c9d74cc4cf1bcd39972b6d12ec1dd1607bc6f3045 +size 199058594 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2534e29c915efe64051f2b8e9f237b95c30ee77d --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db9f072ed1be710fd6d7721496d209cb0d6b4ed94377572bffb27198c7981b4b +size 199058594 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1b66ce9e0383dbc2d188542700fb7c2b8ac35e3d --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8fc004072548d84f62e6440435060f188fd3d191a85b7354fa753de78774593d +size 199058722 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6d1daa6171e7ce8868e96501c319288175a61c46 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d8bf63fff46fb468000ec74c1fa2f83525d51d87de1e57487fdf32b1c4cad4e +size 199058722 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..49b2d3bf8299336e9e297fb90c04c6d348303db6 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:458329044a90c87a98b86182c368434cf6ba4fe39dffb18a170dd7ecc75f09e1 +size 199058786 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ea72c9447af9ac8987c8465beabadd2e52c2cca9 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:56d6ea607b3b71270adf97b49b64df1579780980508fe45ee549b8fbf84854be +size 199058786 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..407ad99154a972a83a575d914865b338f64479f5 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b46d4309cc6fe151db51596b9eea833dd859965d8ef42f8e5d10a58936db9e74 +size 199058850 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..832ff706724b98444befc58bec0cd2f8ff7b2976 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c15b7c64158309952357436c74ed297ff7ff5cc391dedb9b48c32bcb004ac13c +size 199058850 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..32c22f54e7514cdf00884bd335576b8991e5fb17 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d83b050ad8f797c86ba3559778899573d635cabca003379c8e311a05e6297c4e +size 199058658 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..daebe0ff807b5ac254a4abcc8abea487df3cc812 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea6f5cfa773ca0e4b2779ee592b13ad859c66591ad6eecc4687421700694cf1a +size 199058658 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a1ee566a4ea32e7bfae918100a0724ba9f91529a --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31451eb9447d9d0b26d2d369d482bf2c5de110a1ca257e40203f1ea1e934a11e +size 199058647 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b8bdf76f4ec9b43892346f7974fbecc1851ee458 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef0d3bc4fcb08eb5502f093ded758add7fdbd7dc37da99a76ecd0e7ef60063a0 +size 199058647 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..24c45b023283f533243e27d9164b3183d48277ee --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:368f3e0c17039f214b7138d97a9eee984e5487be51e958619219a3de209dcb6e +size 199058722 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c3e6295f79d154d900fd9ebad0d4098425ad3e27 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:854b6537b8eb18f1cfd7efb6bab3bc74f6435a4115df4185aefb351d47c28305 +size 199058722 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bedf9ec0206a4f9f1f1f309eae20c2ba095f6271 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8edbb0d26119cc0d1bc6fd3decf0b53e8d7c9e2010c980c7810a1568ac3ac9f +size 199058658 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..aaab6d34e132939e2609947985ae0d86be182844 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d7dd2da85612c89424a3cdb43dd5b55e3bd88664bee810de0d4f2cd4292f782f +size 199058658 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..31433db3844fcf554dce8587b1845af57320a375 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9bee1ad0e3be88244bac213ccad8279bf23afc8a422ac9511aff8d08388758d8 +size 199058658 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a5edcbaf4724c6c001fc8f52fe3dacf32420b019 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:29f091a6073ff1ab60d06ea46f0acab2d678a6f30af093ef5265f3808738129b +size 199058658 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5e452d12fbaa93136f0e406512c94fb8cdd62ef9 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0cd5fdc603fbfdd79d07cc50591fea3da15b8e24c18ba4c924696a06656f4b57 +size 199058722 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7764a93fa8006e2a13c714b38386d349552e61a9 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e0b94f735bd36fc5e114ae15dfa00b5edf4d4f9bceb1439ce0adfe7e0e4e6fe +size 199058722 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7829765c3f28b2ffd6fa197e179453c27a41ff29 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7d5a1e96ecbbc21413084f7bd017636e353823211638d47893411067bda0b42 +size 199058850 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..23bba3a6fa16ac1c10e21ab04cf33439c2efcd1b --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9eab60fdd7d4fc6928902cff042b98515f6148f3175b729343fd14b5e953df6 +size 199058850 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f3e66d5562dd46cfeaee8545e5dbce138670d92a --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8c4ad8dbe7617a33b73866c62877bc2fd22968b19b406d79d4338db0a933f48 +size 199058722 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0a48441a275dc38b8ec7464bd708ac21b63e96ea --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:99d61b476a868cff13fcd1e581449c70ff6d6df935b21051eae27d67b31b371a +size 199058722 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f293892b6eab0726362bf4467d87aca3657b7dd1 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:67ae3de2b9997593251f480dd5705701cbdc32943ab387a534eddfe3a1c4c79d +size 199058658 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f5562b9153c0fed06d256dc0b68806444795fc02 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e6442b4295dc0864c3066d011f82f575a2af0c71335adbae11b978a24247f0e +size 199058658 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0ee85103df0799135202ff077a4ef82816a43baf --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea98655c5aa5495027ebe49a0720b2e0e6ed734d014b1d5c07806e40633ad991 +size 199058722 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..313c507f579845dd705a867fcac9dcfb1202d856 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8fef29da84ed0d7123c38d8c76dba354bc531903fa9c1a9fdcd7cb741f66827 +size 199058722 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..81391372b001637becce00d68b12340c62f2a162 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:32faa687ed23cecfe3d2212d2c8cdee83d009e77232a1ab44d5d390ab535e185 +size 199058658 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bf356012d6154267ecd3d301b0bc5ccb36acff73 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:85092f5c11af03de6117b9ac61a490dbc15faf2a8154788ae5a870e5e02b27f1 +size 199058658 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..92c0422d2318df496a2004627f121e7b26d14715 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:40e0ca3c1ee2ca68ae81f9d0f89119b78f2d6aeb862207a11773b9c31a53c5eb +size 199058658 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..02579046f148279121c300af240aa285879deb22 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d4ca2e2c5a30cf21f1c9c893e85b95a0dae0a405bea54c17e3c2ff6fa40ea5c +size 199058658 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..086ef5950b47c3a3a58d725444a11e5f8bfc38c6 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a6601e64a374fd41075877ad4490de90b1005302432e7563189f55eed3aa95b +size 199058775 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b67f803545ec82c48b2f866b286ff6556b00d903 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6afc051a84baad7133c1e269c69d0e271a74d1722475da2cdff1c5855b88f029 +size 199058775 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0f53857ea43fd9c85976a33688171ac0641f43e7 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd7c76d3621cc154669e5974a0053be0ef38ab98ce7d870c9f059d36a4dc2bfd +size 199058722 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0111af35e60f38a7cf5b3ed95a732e7d52df7194 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d744f6b45487749caa0d396394b3a052e75f1737a616fe4b3cdcce9d3068ff8b +size 199058722 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d463ed02b03d1715f8a8b8bb70c6e207879d7e5a --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:576b1a6de14f338661f5e48f9853e83233b4c296a893106452c16a8ee1c31e3d +size 199058850 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d59d4271ccc6f0b0ffde9fb4e7fe89a68734dde2 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb7db1ca6de827fddfe1747568580d67a452037258a1457fb0b78af5250d976b +size 199058850 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7f47ea93fefaef4a3db5172028a3c39ff2a8cace --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd6ad11472669de3010d7172cc0e347a397caa7c408ccafd2aceef000d4a2148 +size 199058722 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bae7c2f7c5fa518ac10bc6e780e8101168408d83 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:156d5e9d9342c88086e0295aad2a848251be9a69631c363cd2dfaf26de7f466e +size 199058722 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4d2b2d272de11ad36471f9cd43ff473906c47d69 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a077b4df0bea2d8048cd520632f227cdd17419739a0f2421cf131a825f3923f +size 199058722 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2054eff16591614225773ddf5a0772d80498ea30 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73c4f1a96536d1df0f074cbcdf9e0e589661ca79df17348234879f9444610791 +size 199058722 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1b8a35cb27f6215ac66fe9780e4d86a722b908bb --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1568505ba483ba5620ab749b2513d50ce84124a433e764a45a661677200b6529 +size 199058722 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7d5faf6a1ef819592d68510455b72c5ab6d18e1e --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8410c27a0d08349d42be9caf958c785e926a19905733e58805e16d1f979b624 +size 199058722 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..adfc861c332b771613494378f5a12c6c740415b1 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10816a63aeef4e31472386d7292588b93600e9bf068036b11ce30b44f605e3df +size 199058658 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bd99131b32bede662bbd0aec1f3221141bb09d98 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6bc216443bf322fb4f98468fad1dfb87903c49c214f72f36c8c8e2407f21a7e4 +size 199058658 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3faa757390fbe4ac54bfd6d3e62678eb3b427d55 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9fe2b129d6688c24494e1c2afde1506242e36d420fd9238c78ebf0eddb9b5b29 +size 199058722 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a2d3bb1bb5f107b9b837423c90e3bde18bf1011d --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b99a36ed9b1c6091407040146d36c927a3503230d20a0d7d756eaf1d09077d46 +size 199058722 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dd4285162e4be92af5d80f20ffb5b5aa47700cef --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d94acb62dd05609df240e87220955fd4d1ba2f3b9e76cd3afb77e7d82428cbcc +size 199058658 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..42d50148496a2c88bf4e938e5d7d92b8cf3344ef --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bddffa180e46de9d636baa41bd3daa7f317a3331b282ac3c29d7c32d484388ae +size 199058658 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3bd44f5cdb7bf5fdf0373c70e12da6ef79b58cf1 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0fd8bb26ae8577d02f70fb445e817ed1ba7d78a7c90a61024e158fe3f98933ea +size 199058914 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3e178361cf56ab4bf9102e730275b34208220b43 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1029d775462a3b3b50ba722492aa4b74320cdacf7b94a37cb23f775e5f84a4d +size 199058914 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8d5ac02bcde022169a7055ecaa5fa774e45a5a84 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:07e9e8d93afbc423c527d836b2585a9b7ac63055a7e75b986526ba74b2717a73 +size 199058658 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c979ef353069bddcce292f637a0b0957e7432005 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f3526a51cf9fc8e2dd073e10822d613432dcdb9bedbf030b90a82010f0dfd4d +size 199058658 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fdfa805730b55929fbc163401b45748a3f08d5ea --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a10a739aedac37c71caef5205fbc4863ea486d76f9790b7e17bdf5636134dbd +size 199058711 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3cfa55e289c2afeae8954dc55023f606f2fa4e1f --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9465c5c470017a9567d91315a3e9946904f8989dc4d7a0a1c11dd88343f6ca2e +size 199058711 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..077c0c3cdeb1e4b5bb0852900c8478be4549238b --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e04500f95fe0e30e3f93618c257e8ccc57a68ecfa785f8742c2f69e4499bb26 +size 199058722 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cadb18b5eb6111c13a866f53704fe84eb09b296d --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:814633a17bbc088a426045f88e5bfaabedeae7e75d3c49585cbb78a5e83d3288 +size 199058722 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..043d6eb8a4057f318b38f7c9bb1a2942b1a50e2f --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a8e7f56f686a2d227f63b62fd77e84d8418430ff953630e36a76b4b2e0420a3 +size 199058722 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1db3761f65008bdf9b91f6d347d274c9b242b943 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:270e6e06e99f4aeca2e9af7fe6d8fd48de927e4d0876060f0aa3a7c07b4bf3ae +size 199058722 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4070d5d09df3984ce2dd6d0b37d625361940bf8f --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bbd461dcc346115b62d98426f8218f33677436cfb0e6bd40e6aa5b01024791ab +size 199058722 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5b24a7d6c92e31c67965d914f8cdfad81b765437 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84809d270ab5b0e38165df317b7709d4e4b998ae098844669b4bba47e62c8d87 +size 199058722 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1e2879e642e1bb4fc8773b311e93998e292c9ee1 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9148a09c9dffdff2c86dee451d52ef016cf8c116343ce6d92c37d53518083f65 +size 199058658 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2e9bccaf5520babd1af9d78ffe059b052b189ec6 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e9118902f76fa4e723713f99989599db58620ef83651fb6cdabd860841b0c2c +size 199058658 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c9c08ee8c49e33e264bc34338fd82b519483e7c5 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d047ef9b1fc19d047430b9d93b1f91e786a48a5d6bd0c9f428d26a7ac18cd6a +size 199058658 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0d9402070858487e221645c6930f76d01274aee1 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:632354a9d9d0845ba3c20b602abff6a229666904ebd6c2e765a65e240226636b +size 199058658 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2ec23cb39e938e52615ec2d5d0c239c2a6430f24 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:62d90b237a1a37de3367291004ab137e0cdfb6a543a12b9452ba25c0703dae11 +size 199058850 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d901aa40a691086bb9819414f590b33962d48d93 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:98119a0b9d00529d133d6d6bc677e4ea93a7b1b6e688a7cfafb32d5e86dde221 +size 199058850 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..92f3a2fbe070c21e67638d5b290ed3f1996e603e --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea95cb46310eedd11c7cf3aad9161b22a753e9910f757ab5215b44bc42575979 +size 199058722 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bf751b24a45a9123ba3fb95b83fe50f592d19205 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:162d40acee9b7701c9f80bdb331694c2d46217084119d56886b2c96a54437e73 +size 199058722 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7a3fa6addada65d66cc1837b46c2bc906c533071 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b82e12c9cf75a34dc789a35589bab5b48e2d6ea7a88fcb4ff25e10b758d509a +size 199058786 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..390e511de6fe5e683fe984952066066dca14e475 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4dec3e59da9ccdaf86154f58497ab88930295df0558ee261015aeb7a20b6acd3 +size 199058786 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dc88078251316aa8ac07edcd7cc57783fdc686c3 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f922b80055ad9e0174a759db946d539fb1a31d65c057b4446ab85a8cd909b834 +size 199058658 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c5d1cd49cd9badfbcca1d6ace96fa2faeaf2113e --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:311de83075dff341ac93de5791c5e9225a0159eff31c1afe2e89c5ab28297a93 +size 199058658 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..088877a259248a185f84f9ee436e0de929d41049 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d9cb64002980390a33f749f24af24fbb7cfde4050fb9fa20eb4a30b88ed99a2 +size 199058722 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..139df143364159b930954815d787ed73c7b62f67 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dfca94f4ec8319add7ab08abb3a3fadf0de7443106287786d9f75393083991b3 +size 199058722 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ed5632fa625d01cae5eb28b71064c2b4f4365e87 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:533d2a7238bd72529082d29f16a6d197cc227881e221102c73e07de3d7a32cdf +size 199058647 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..008bb4315a1c9b1ecb4eb36455ce59371f081f20 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa01d7386fd5257f4d64e2facd449e3658832bfec217e6bdcf0139bd6731e2de +size 199058647 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..032ec0f7a8d090b9b9149ef0e721df4615f2c539 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76dadaa23b6adc64453e1e411a11cb29f8b632a600a688e768383107982c7506 +size 199058658 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e0992c47dcadf998829b0ec707e4f156dfa81818 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:337e105bd5f9baeade6072a79093abc78dc71566aebff61a5b1f191f819d56e1 +size 199058658 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f3dfde59716229dd9a08b85e93d95a7ada45bbf2 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc552bf8ac689fc557134ef9af1a4b68d27d9a8c4a2c6f664f82515b4605cc9c +size 199058722 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7c884fc052028d9e770d2129b4a61c00bd33707b --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77683c7649ac11d6d375c9d70e15d29c5ed4f9707ac948a88feb88803f2c02b8 +size 199058722 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1b17002b252c6863b99faf17113bb1ce74cf9d5a --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c5ce6e05b0cffc8e97e3bcec8e5309412a228bd738499ed2cd42efceb777cef2 +size 199058786 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e12070dff0868420a4fb2b8e3f41dd19c82606f1 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ccef1909b515b6ac4c25ba1f52670cf6eafdb966bff87bb3177873764d6d021d +size 199058786 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a6ca032547e331a4a1c7cd28262fb09331dc1972 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:53e4097bae06b27aefa7732f3287e451060550316e612be799cc9fae59cafe20 +size 199058722 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5b27a816b15f754ca513ad0d56fdffd4dec79204 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0239fbbf3e5cb649b1ab31a1edb75a62d268adf25d04142ec4e3e470daf2350c +size 199058722 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6f3d1f9bbf0f9892d07d92f1fe6f4e191f3954e3 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f3091a45305079abb122d3c0f195c72ea395651edd8ddd1e1b2000923486c4eb +size 199058786 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d76418be6b9d9c979f6701148374cba08d9f6a00 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9714b490ed9eb84f1dd494cf859aa4438a284dd6c564f94699da783aaa47b294 +size 199058786 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0a0bce368f7288775616288fe9e7d0ddf0bf87aa --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:754412c5bec373598bb820d50879ed46fd29154bda1444daae187b72daa77088 +size 199058658 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dc96fafeade0e54715999c5c9c5a877a4f97c633 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf535438087b76d3a93d909e696e47cf0bc6df7736c93735c3b6a32ef7b0ef2a +size 199058658 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0343d8283a287b67fbdc4e1a9f1cedf2d8671368 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51eaa57c199d8cb9d59e987db553df9ec31a8e8d3bca1d552ef2fa87f9385c9f +size 199058786 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d437e306b66b46548d8bd19bedc7cba2e2ca0b69 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:28efe0313b48a71f8cbc55a7e251c64d804a6c1b1b7f0ea82aa04c515f2a8d68 +size 199058786 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..38e4973e61ca78c274ca5dd808892b5b76a1ed9f --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2ceaf61aa09f107b8233b1d87f599517fe0a7756aa979f9377a213119eddb73 +size 199058658 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e2a60c6252f751a2c4f016150e8993df6bc81cd8 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c87be6d39afc96b0f812e10ecc7f45ccb27f64f03f0ee4287b183fa84c6221f +size 199058658 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e7a472a94f082d36a316f5ec412b5445c1aff3da --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4088700afb62e801d80486ceb006b9ed0795cc71716fcc7916fa2f6d923cd7fa +size 199058786 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..efb7645a24097d36a88598072d39950615788701 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7c65b65d29f8faa3ad866d0657b0efd777bd4a40aa68768ec8e1c4eecdbd5b4 +size 199058786 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1e8db5db9c0c46f5e2546e4c5f2439167ad1cc4a --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe7e38c0939649b4f07f62b60783cd99dc9ebba41088727a5c38765c75b576c4 +size 199058786 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3da65e60463456bb0bb3803dc77d6837d97365a9 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:789c9d3759bfb8d1ad8a2ace6a46875ea0b37ce23d07bbf90547b0ae9b48bcd9 +size 199058786 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..62cd6a8e0b3a291977635ad27ec8ceeaaf2ac331 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ffea5ea32f8d68d5857fcd58de01cba109967b0221dbfe1ea2f410a896262c74 +size 199058647 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d9ab08338b9d17ce80e4a2bde3a1577460b94273 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b36cc9c64a333d92fee42b64e525dcd967bbf97b0555b4eca6d938cb07133d1 +size 199058647 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d6b28e89f9445d8ad1d135bc64263161e2c78522 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:62163149079f6bc40e6a121681c71002d2e768ef87949b2d6f3a9fbe225164f4 +size 199058722 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3774e2676629fe07131f13af548c6db524d1bf56 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b7b186844bc549611733407ef003b52aac1b417c2117643e42204ff7afa1d3c +size 199058722 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..277f179c1236b6cccfac6e01d4d0d8d7b2531675 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f9b52ba5c6f6d56d47dda7b3a680d96e0b40f3cc193bc6b51314265c3e37ffef +size 199058722 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..18ea0e0b0852abba059156ae94199f764bf00e82 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:564d26a75d180702c0417c2c84d31ae546f87e589aecc7d4cbe16b4736a76bab +size 199058722 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cfd18e1da52c7a67be2b70f13c0f679175bc2766 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:95b7e6041864e0f0a2d6d4ce7c16aa6373d8a5a6e3fd4f1160417e7ef2011d94 +size 199058658 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0312df0ed55071f5e70c00e3d0a30d15ac7a232f --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc34db421c6eedbffcc1cfe877be42ba1465cc74c4ec0d9e9b5aefee03ea9441 +size 199058658 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..037ea28110ac35e558e0d57f40372982e26044b5 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f394ef4459df9931afb183096d46505b174700517b36e851470a28322f90a72 +size 199058786 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..babd07d8f58d3fc4440e7c08c9fb44544fe28bf1 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2269d5d45142a52fd62ebcaa96fe8db3fca26fe52247273ef4edecb75e66a7f0 +size 199058786 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3227a13538badb6fb3544a8bd908f59241b62449 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d64c92edd319bfbc6ba4f904d0bc73567e0cda00a8b98ad9a5ddedb4905ac6d2 +size 199058658 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0e25eda1f9556d516e8083a5e552ef17d654ea7b --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:198fbd99d5a6cb3d8777e9240bfbe164fc8513cfb05711f6abee79708351db0c +size 199058658 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1088741704250879fe2ba2ccefcd9d48c487d9d1 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db735613ff409486ee836926c895666b579865b149e3dfb84b13fa642ce52aa0 +size 199058786 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0d7e93fc7d26847c116b60daa5c1af6edce55b91 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c527f6ec6fd67277aaf2499cc04901bc057c6d3e0f97b63ea6d68d5ccdbf57e +size 199058786 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..30ab770b099cd06b5f9740c0736829f12c04ef92 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a991a11a041d5bf1b3e13f706cad8de33139595f53cf58ccb6452a06dc1b6f7 +size 199058786 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..86405e0904516432992b640b0adc17975c914cc1 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:021165b75c18aa870d09d449b3c42d3ee05a3b622e6bfecf50daf6f0db0e9fe8 +size 199058786 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d397484a3746b3d0234fff2f5f4252ca1791dc69 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:299b06b24849b59f1a10d7a6d6854cccccc708a34d104bc60601caa90618e3a6 +size 199058722 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9dfa5e238a04a7bdb9522ed549d3abef436680ea --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:11b4d7766e05dc2a49c9b0716ef556c75a533b80df8c8ccb78d83d3c6245c48d +size 199058722 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..291018b7d986ac00f3a90d8ca2333c602251b078 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dfb9029d258d2bc35c4921f302756836de5783ae0e09baa5e079a245c8d16776 +size 199058658 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..10b888e9a992aa2f94992922dc7c1d5dcb76faf6 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af9a107b6ffa8c927b9346ca478eebe67f2eaf6d507069ebbd9d41724c8eefeb +size 199058658 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..56975ae7bf2f2c921e2e83b121b2e537026851e8 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f6bdbafb26c6987c466f2961fb552f87aabb1753cf5e0d8b468a1bc0203f7972 +size 199058658 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0ab3a4e96bff8deb12f48c6ebad9a0f50638796a --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9093bde955a7e51b76780eae3a60bd33877d1013f742b3f0e965753ab03bf559 +size 199058658 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ef559022f74f676791460d8f32fcad9689c3ccd9 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3dd88302677c4789ffc643f0804a91de1bb814df1f64458f285eda40d4141b77 +size 199058647 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f3ac657f33bc0b0636fa78056b5649b0ea89a812 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f5326908ff3845baea5afde48f6bcdd151906e1a94d9240d69b75d46124e8136 +size 199058647 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..808dd593c97abbd5bb1dec4f1a741c8fadcd68a5 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec4c3dafefb5cfa83cce9d5a82f93c09053a6084e4dcca6138f051b95f3fbc0e +size 199058850 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..af9065d1237fe5ec7ebe487a7f25190d2865ed05 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f907db095a3f5e5632f135a8758232777c5de88c35e5e3524d3d683ed18ff74b +size 199058850 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ec39cce30e0b017fa41487f052e91657a46b3cf8 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:031fbb848ff0c8d5c399edea49e0c1d0aba3cd5ab540e6615aea359893538050 +size 199058722 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..72c8ead5efed717eb35772b3b725c0766ef399af --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aed6241af2c564279a506f8b679ba170f5414f3c8042badea48ab59e0da873cd +size 199058722 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..33924f4df894daa5b79f85861823131c90cc2609 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f8997bf8e18f0af7967b100ec6e3b320188dd2f78f4c93eccd0e60c8755b309c +size 199058658 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ad0914d93f167e46a7eb2ee5a535ff8b9b808e68 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b8d3984f0ce8b0e0dc368e36dc1937a7a22e7487b70b6052790490350eda868 +size 199058658 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e3e5cacd1a26d1e4c24fedd8df351cf9e6c36abf --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:145988e2469253b71346fda355521901522fbbcecc1663c28008086f007243b5 +size 199058786 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4c5ca03ab3a2c2e95cc8e9feab1efffebb5522c9 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d8de9327859338399e3d660c70be61dfe22817641602bdf0956ca4a5adfbd085 +size 199058786 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..076274960939c85670ba6de93a8cb06536865284 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5223ef3b7e84694d5bb0b2fd4ce654cb5c121b72ab5ee87e34dc6be400136336 +size 199058722 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a7f75af78ba4fc52161f5fcc3c7e4c6e0baf2171 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5fe4dfd4a36d0e685bb7494ecee868c16e03fa5b4740883e44e5215cc8ced0cf +size 199058722 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4ed225063f20562c5da089fdfd5e525626522c8e --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b098475fb362f95357517eb75c07d22e04d406292e1aab54bffe5bab8813afe +size 199058722 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9fa29fb5f3c1eba78c09defdce78126808b78066 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:75a6266e755b61a9f376b835f88824a5c5201237000aa5ab7d4c7d063ae769c7 +size 199058722 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f2fa1c3d7a9f5c0e23d2b14e4e2ea78cb0bcdeeb --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c43ffc7db18071375f827f7566def4dd4217cdfd4f6fcd141a3d49b838a1114 +size 199058722 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..00ef644a2e16e109196ff26d9a733e9d85d039dd --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:68e05a0dcea73bb89892dbc6446afea00d21ec12de447aac108090d0f17cd2eb +size 199058722 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a6caf4be9429de88a44ee0412c956d1c1d4ad756 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:403eb8b86cd4524b71f8bac79535b10b65f7d2f7bf63391ff147d22e096854c2 +size 199058786 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f52a8e9c938ae86e377a21402317ced4a0256fae --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce04d63dc36b7832f2acb304d235c01566faa2b4de3fcf335d990eee1afec709 +size 199058786 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..86e686a769cb63434a5ebb2abdc75956f1d27dca --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a13b934dee38ab62a54ea4c86b9ba933ecc894bb2ee32b5f612de0cbca554788 +size 199058658 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e0a6d5bfbb53751b2fb5b0f12289fe2eb6bda153 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a3cea64aaa6853e123800a3e4359a8e7040ef56520ceb0ff0d0c0db0295e9200 +size 199058658 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d5d96c06980a5e8ab9a458a35f11073066703fb8 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d086bcfbfe37e0e005226a459ba0fbbdd7b36c1c741710415b1f73bf822cf9aa +size 199058658 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f1aced7e97668401dcb985edce2ba15fd968e74c --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06d62959af283967b0cffe585bf387d2df13f12ede4c408d09016e29e4925b8c +size 199058658 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ab9559acb4f2989d68c5679a25524d4e19b98452 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b95c6b5c4c042c302f730315ee57b56535e9bd216a92347acd32d1f8c51c19bc +size 199058839 diff --git a/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..635c0de1c6513d69aac603719b271a55523a6901 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8cdc22329a4ffa8d516135dd4e12b207b3d783e8443b50fa9ceb13f1bea4d70d +size 199058839 diff --git a/4b284b1b9oscar/global_step80108/layer_01-model_00-model_states.pt b/4b284b1b9oscar/global_step80108/layer_01-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dd6ee0a2ca2756220797942dac882f92af6eedcf --- /dev/null +++ b/4b284b1b9oscar/global_step80108/layer_01-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c17c301bbc18188f7faedff32044425ec070c79dd781514acb397fa0d573ee5 +size 167511299 diff --git a/4b284b1b9oscar/global_step80108/layer_01-model_01-model_states.pt b/4b284b1b9oscar/global_step80108/layer_01-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f2b48ae810f0546c57e26b920b5bcec432d5acfd --- /dev/null +++ b/4b284b1b9oscar/global_step80108/layer_01-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c547a121ffd4e1c77894a29c6e1a6e622c1f670ec52d4f609db303083f0933b +size 167511299 diff --git a/4b284b1b9oscar/global_step80108/layer_03-model_00-model_states.pt b/4b284b1b9oscar/global_step80108/layer_03-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..452fc176d65a7e976d377b09b00e08fcc4600deb --- /dev/null +++ b/4b284b1b9oscar/global_step80108/layer_03-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb79ec6a4b38d0585c36457b196c4e033feadc6a8173c257915388097bc11bcc +size 113308931 diff --git a/4b284b1b9oscar/global_step80108/layer_03-model_01-model_states.pt b/4b284b1b9oscar/global_step80108/layer_03-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9238775897f508909c56d75c5b47fdf698e12752 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/layer_03-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:218ba1c42e30885d9dc65031027084a187db6efaae73346b047e33f3401c73ea +size 113308931 diff --git a/4b284b1b9oscar/global_step80108/layer_04-model_00-model_states.pt b/4b284b1b9oscar/global_step80108/layer_04-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dc08b821915567a4f685b831408a764d78516e32 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/layer_04-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:99ba7707bbf351a00a6afed039edb70cda66d1a5b44078bb824f760836f47c60 +size 113308931 diff --git a/4b284b1b9oscar/global_step80108/layer_04-model_01-model_states.pt b/4b284b1b9oscar/global_step80108/layer_04-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f52ca77c16913268d4fa288c9aeb1090be3ee06a --- /dev/null +++ b/4b284b1b9oscar/global_step80108/layer_04-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bce7f53b8b7f4eadf6dc1d54d070db0891da9767badf2dd825b3d012c127fd4e +size 113308931 diff --git a/4b284b1b9oscar/global_step80108/layer_05-model_00-model_states.pt b/4b284b1b9oscar/global_step80108/layer_05-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d5879b7e5346ec1e48876874955bd6b702145e3e --- /dev/null +++ b/4b284b1b9oscar/global_step80108/layer_05-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7db892b9dc49ba9f960380417c5f28248abcc5fb0eb61663d5400986ff8ce951 +size 113308931 diff --git a/4b284b1b9oscar/global_step80108/layer_05-model_01-model_states.pt b/4b284b1b9oscar/global_step80108/layer_05-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8d004f09d53a16fcf2e3925ea7a538036b93967c --- /dev/null +++ b/4b284b1b9oscar/global_step80108/layer_05-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2cbd7a660156d7a0098304febccde3ccc8fe7c9a1c39ccbd139248a4eb2524d5 +size 113308931 diff --git a/4b284b1b9oscar/global_step80108/layer_06-model_00-model_states.pt b/4b284b1b9oscar/global_step80108/layer_06-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cb8dbed91870d9725de8365cba4bbc913e5de383 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/layer_06-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4067b2b0266f78ebb0ff878362e450472a9cfe84e019b6150dd5f701922b5692 +size 113308931 diff --git a/4b284b1b9oscar/global_step80108/layer_06-model_01-model_states.pt b/4b284b1b9oscar/global_step80108/layer_06-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e3014d0a20aced26f386a5f47322d3aac1a00071 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/layer_06-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:460d3a1d8fb81b49eb6c4181541fd39e25305e179ae75c0b59f327b6e110e92e +size 113308931 diff --git a/4b284b1b9oscar/global_step80108/layer_07-model_00-model_states.pt b/4b284b1b9oscar/global_step80108/layer_07-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a356e12818a2706e573ba8690f6d387d0f5165c1 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/layer_07-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa1a3d78771022a49018dc6700b4ab6ba9d6d94b53b28b17b80b827403ec361d +size 113308931 diff --git a/4b284b1b9oscar/global_step80108/layer_07-model_01-model_states.pt b/4b284b1b9oscar/global_step80108/layer_07-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1855973a8b8c3913092cb9632bf26fc3266c8077 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/layer_07-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76d36bde38e1aa0eb9ad6eafb6ec9d17d8532eb2c0ecb083ab13537f57c6f6da +size 113308931 diff --git a/4b284b1b9oscar/global_step80108/layer_08-model_00-model_states.pt b/4b284b1b9oscar/global_step80108/layer_08-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5168fc0dacb4fc771c8002c33b8d90fa260645b2 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/layer_08-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:caaad83e2b9b89b3f694d7e0c76c4011968b064b266a966c1f7ff64c9b931c5f +size 113308931 diff --git a/4b284b1b9oscar/global_step80108/layer_08-model_01-model_states.pt b/4b284b1b9oscar/global_step80108/layer_08-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8e0ac237eb4d9e4ed8ca8787a987e8b143b4f253 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/layer_08-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:59d29069f0dbbf7acf4e6ad245e237b695c8b4e84183cf00c2c7bd7f962b530e +size 113308931 diff --git a/4b284b1b9oscar/global_step80108/layer_09-model_00-model_states.pt b/4b284b1b9oscar/global_step80108/layer_09-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9b9b6740f100d31dac1a98ff6eed5b8c454babf4 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/layer_09-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0901280685469fc301a5e68924cee8b04893417c254f1165c0cc8febf7aff93a +size 113308931 diff --git a/4b284b1b9oscar/global_step80108/layer_09-model_01-model_states.pt b/4b284b1b9oscar/global_step80108/layer_09-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..38d1b0e8d0f97ecd5ecc10b3d2035f9563fda82d --- /dev/null +++ b/4b284b1b9oscar/global_step80108/layer_09-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:40930b4d4049e5073d1c84fccaac8be945e14bbe4eeca9940d13cedd8a780a20 +size 113308931 diff --git a/4b284b1b9oscar/global_step80108/layer_10-model_00-model_states.pt b/4b284b1b9oscar/global_step80108/layer_10-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1337d4fbf8f077a9266f7c7654086147954425a4 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/layer_10-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2546e48052f86aa384b5a84f61f411b41cfa76277d36fbb3685c81cdac30500e +size 113308931 diff --git a/4b284b1b9oscar/global_step80108/layer_10-model_01-model_states.pt b/4b284b1b9oscar/global_step80108/layer_10-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bd9d589228ea2862707319cb0615ffd6bf36de49 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/layer_10-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:93f96a9fbea848f37d358cba643bed318e79aacbbaa4c20a5520339f7ff01db6 +size 113308931 diff --git a/4b284b1b9oscar/global_step80108/layer_11-model_00-model_states.pt b/4b284b1b9oscar/global_step80108/layer_11-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..946019dfc77b9c2b7148a2aed9c9cc06ae768949 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/layer_11-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:56e7f15e558d19593c066a89d335b32d476a9e71917adfe57efee98d558562c9 +size 113308931 diff --git a/4b284b1b9oscar/global_step80108/layer_11-model_01-model_states.pt b/4b284b1b9oscar/global_step80108/layer_11-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ec6c2f686f1766e1184732b83373975de87e820d --- /dev/null +++ b/4b284b1b9oscar/global_step80108/layer_11-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a875b7035e1b70f12eeaa6d4a8c022be23150765349e1be1f7dcf65786340c35 +size 113308931 diff --git a/4b284b1b9oscar/global_step80108/layer_12-model_00-model_states.pt b/4b284b1b9oscar/global_step80108/layer_12-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..be0ebdadf5ffc6185a73c90e6141c211443bbe4b --- /dev/null +++ b/4b284b1b9oscar/global_step80108/layer_12-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0cd26d2a971efd6009c9af7f27542fcc4a60a533b1dbd73af6ef938629efb589 +size 113308931 diff --git a/4b284b1b9oscar/global_step80108/layer_12-model_01-model_states.pt b/4b284b1b9oscar/global_step80108/layer_12-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c33a4412a273210f69e9fdd3c23a6af241b2a86d --- /dev/null +++ b/4b284b1b9oscar/global_step80108/layer_12-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:635233787bfdd7236a828c079efb05d7fc3fabc6cab8626c47ffd5d01188ec85 +size 113308931 diff --git a/4b284b1b9oscar/global_step80108/layer_13-model_00-model_states.pt b/4b284b1b9oscar/global_step80108/layer_13-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3dd4e5a8cca00ec74b18c26a6349f13c302f2513 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/layer_13-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:135d9f29cde5bf96cab9f9278f03040ac518daf441f41c3168699dff449ad6d9 +size 113308931 diff --git a/4b284b1b9oscar/global_step80108/layer_13-model_01-model_states.pt b/4b284b1b9oscar/global_step80108/layer_13-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e27f729477ad8dd948d436a7450da55ae0e536b --- /dev/null +++ b/4b284b1b9oscar/global_step80108/layer_13-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:07eb885d12b602883ba385769613242c6a15881435dbba9def2a0d049f20dc40 +size 113308931 diff --git a/4b284b1b9oscar/global_step80108/layer_14-model_00-model_states.pt b/4b284b1b9oscar/global_step80108/layer_14-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a29c789716f6e556f50bc82254a4dcb55f151b58 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/layer_14-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7bf16613462be9851bdd2cf2c077b70252d2d1df5732cbe8aa225705e6ba155a +size 113308931 diff --git a/4b284b1b9oscar/global_step80108/layer_14-model_01-model_states.pt b/4b284b1b9oscar/global_step80108/layer_14-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f2fbd52861d5a0b5f790b8fbd30e988416f8073d --- /dev/null +++ b/4b284b1b9oscar/global_step80108/layer_14-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4be984fa65e1d568dc3e7d4f43c686d72e64a8b51ef2aea36c4d5997a968a951 +size 113308931 diff --git a/4b284b1b9oscar/global_step80108/layer_15-model_00-model_states.pt b/4b284b1b9oscar/global_step80108/layer_15-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5fc376ae80c3a3e347a88aaea9188edfaad7fb53 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/layer_15-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:48121832e01d857b03a2abc245a256c2e32b4813826a2d508b072a908f2c3ae4 +size 113308931 diff --git a/4b284b1b9oscar/global_step80108/layer_15-model_01-model_states.pt b/4b284b1b9oscar/global_step80108/layer_15-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..20c0943a0258d8eadced91f46072a1a1a27d4b67 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/layer_15-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:09c1fff250d3abf5e39bed4b2735c6aa7a238d2b0b8bcd5f5bf4d212af3a4332 +size 113308931 diff --git a/4b284b1b9oscar/global_step80108/layer_16-model_00-model_states.pt b/4b284b1b9oscar/global_step80108/layer_16-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2a0f635a2dc9ee4e0c41db8c042e2fed54a75b51 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/layer_16-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b7545d5fc0c2a7daaad1af2a441bd2bcd57d271575f3744642f3dfac6203b59 +size 113308931 diff --git a/4b284b1b9oscar/global_step80108/layer_16-model_01-model_states.pt b/4b284b1b9oscar/global_step80108/layer_16-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..31b70641b0b5695e8311ffd2be6ac0ff23f0642e --- /dev/null +++ b/4b284b1b9oscar/global_step80108/layer_16-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b50b04b41abb3ef731655c877b3a8e7a7048e0da23ecfefb7a43474f34e5e18 +size 113308931 diff --git a/4b284b1b9oscar/global_step80108/layer_17-model_00-model_states.pt b/4b284b1b9oscar/global_step80108/layer_17-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..59900851ce63e3bc1f4f0a271081bdfc818fac27 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/layer_17-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee1adb3e24a74fcbb0956f80ac2b48178c2c957ea71d1818dd70b28eb4c124e9 +size 113308931 diff --git a/4b284b1b9oscar/global_step80108/layer_17-model_01-model_states.pt b/4b284b1b9oscar/global_step80108/layer_17-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..32bb9b3cc3f996b8c65576a132903fd9f61c4814 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/layer_17-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:52d1ca31c5de4a55656cc497fd99ad2d919993516c698b9a60612ddcc5d566f1 +size 113308931 diff --git a/4b284b1b9oscar/global_step80108/layer_18-model_00-model_states.pt b/4b284b1b9oscar/global_step80108/layer_18-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7401db6cf0d7bfe1788ad8bc2f91e187724c4f8d --- /dev/null +++ b/4b284b1b9oscar/global_step80108/layer_18-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8218e73c6ffd9ce6f38ff1b115fb564ac2e20a5359ad7a6ee168721c05649cc +size 113308931 diff --git a/4b284b1b9oscar/global_step80108/layer_18-model_01-model_states.pt b/4b284b1b9oscar/global_step80108/layer_18-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9a4aad02c130b80761d8ece59a600d3d306f4d4e --- /dev/null +++ b/4b284b1b9oscar/global_step80108/layer_18-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0267fdbd9b20acf9d91184f7386bae5018555c5813069d378fd32c83330dfc98 +size 113308931 diff --git a/4b284b1b9oscar/global_step80108/layer_19-model_00-model_states.pt b/4b284b1b9oscar/global_step80108/layer_19-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..70b4ad5ddeaef4541990ebe150585d77d4de63df --- /dev/null +++ b/4b284b1b9oscar/global_step80108/layer_19-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ce4041d8f0739d0443584219649ea2d5b799dd46016ef66665c4a61a3986805 +size 113308931 diff --git a/4b284b1b9oscar/global_step80108/layer_19-model_01-model_states.pt b/4b284b1b9oscar/global_step80108/layer_19-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ea72bc38792bb0da58048084ca760632070118ab --- /dev/null +++ b/4b284b1b9oscar/global_step80108/layer_19-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c75c2e00722bc42fabc6bbfeed12f1567a6d54b367823b019ecf9753d9701cbe +size 113308931 diff --git a/4b284b1b9oscar/global_step80108/layer_20-model_00-model_states.pt b/4b284b1b9oscar/global_step80108/layer_20-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d128f5c84f05652d7f053d016054a94f1d0c1c40 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/layer_20-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:93509acf92ae50719d525795af02527f7c195918a4e8c92ee08a35c2488903a5 +size 113308931 diff --git a/4b284b1b9oscar/global_step80108/layer_20-model_01-model_states.pt b/4b284b1b9oscar/global_step80108/layer_20-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9b3ac6fd247032fc982edbc0cac1a42dfafc551d --- /dev/null +++ b/4b284b1b9oscar/global_step80108/layer_20-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:391ad3f21a6f565a44c128e3e73eb0551aba612d67dd9cb755a6817eaf0a52f7 +size 113308931 diff --git a/4b284b1b9oscar/global_step80108/layer_21-model_00-model_states.pt b/4b284b1b9oscar/global_step80108/layer_21-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7ea6247a6599485cb134946e28b50a82cce066ca --- /dev/null +++ b/4b284b1b9oscar/global_step80108/layer_21-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df1ed77f63d6c1408c12fbf0522bc209d78819a6ad4472cfccce93bebb8f9d95 +size 113308931 diff --git a/4b284b1b9oscar/global_step80108/layer_21-model_01-model_states.pt b/4b284b1b9oscar/global_step80108/layer_21-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..55ce6a319c3021f6ad498435151844809ee65e43 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/layer_21-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b416af628fcd6af28bb15ac50bc2f53e5768ad5bf53f1ae41d1be14b42a01dfe +size 113308931 diff --git a/4b284b1b9oscar/global_step80108/layer_22-model_00-model_states.pt b/4b284b1b9oscar/global_step80108/layer_22-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0c6d1f25f76b09b7809269eebeeca5503b8e12ff --- /dev/null +++ b/4b284b1b9oscar/global_step80108/layer_22-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7976815547f15ea5763f99085ce794aa6b437fe38f2a14c03a6c82bd702e1d2b +size 113308931 diff --git a/4b284b1b9oscar/global_step80108/layer_22-model_01-model_states.pt b/4b284b1b9oscar/global_step80108/layer_22-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7b652ec5ba0e8427fc337a25abf8958304b5e569 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/layer_22-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a1d717ffbea164bddb2ecdcd4088bf0f383df9746a982e27f7e9b7ae825f3cc +size 113308931 diff --git a/4b284b1b9oscar/global_step80108/layer_23-model_00-model_states.pt b/4b284b1b9oscar/global_step80108/layer_23-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..25a1b140149de70f818f6c8ecafb6f48d50ce6d4 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/layer_23-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0323ba7102bf1b1672e0be293be0f2d2e6490d3a9c8a8fcef84659d5bae079e4 +size 113308931 diff --git a/4b284b1b9oscar/global_step80108/layer_23-model_01-model_states.pt b/4b284b1b9oscar/global_step80108/layer_23-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1fab24f6ff7cbdd2719d1454ebcc67510b0b60ca --- /dev/null +++ b/4b284b1b9oscar/global_step80108/layer_23-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dabbe8ceb180dd70113dc5e7c606c5ad779108e75c5e08d393850c13fb4b674e +size 113308931 diff --git a/4b284b1b9oscar/global_step80108/layer_24-model_00-model_states.pt b/4b284b1b9oscar/global_step80108/layer_24-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8a2ddee6b6641c296d40426973c1bef36f061469 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/layer_24-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bed24e3fee22f0b01dd4dba77830cddd6bc13b8c7cb9865e49164161af92dec9 +size 113308931 diff --git a/4b284b1b9oscar/global_step80108/layer_24-model_01-model_states.pt b/4b284b1b9oscar/global_step80108/layer_24-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..08cb93707f056b12aa43c9cf042d64adb7375870 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/layer_24-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc624c36549374690918bfbdaed226508a11247e7c439198b5dde56ea3b5f3c7 +size 113308931 diff --git a/4b284b1b9oscar/global_step80108/layer_25-model_00-model_states.pt b/4b284b1b9oscar/global_step80108/layer_25-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..67b831f15a7acacd8a07c6d106183c94f34d8e2f --- /dev/null +++ b/4b284b1b9oscar/global_step80108/layer_25-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:96a5c04641e9e39fa4b1e6362d8659cf3c7db1a9613a71ca13663b1d427df9ce +size 113308931 diff --git a/4b284b1b9oscar/global_step80108/layer_25-model_01-model_states.pt b/4b284b1b9oscar/global_step80108/layer_25-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4920c02cacb4b49bd0594b8d21798f93cc280a4c --- /dev/null +++ b/4b284b1b9oscar/global_step80108/layer_25-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f188c804c689b3d022fa9631c41b9ffcf3a78f346cc74d8c900b50a7bd9bafc6 +size 113308931 diff --git a/4b284b1b9oscar/global_step80108/layer_26-model_00-model_states.pt b/4b284b1b9oscar/global_step80108/layer_26-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5d786d18664c472489c4063329c8b1ee9dfda524 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/layer_26-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dfbd7be176e1e93b502c89a2654e508206c1a9e01d0a088628cae70150979127 +size 113308931 diff --git a/4b284b1b9oscar/global_step80108/layer_26-model_01-model_states.pt b/4b284b1b9oscar/global_step80108/layer_26-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..831e2936d41788f0e2c33a8af6e23e726cf9f190 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/layer_26-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd71df25d87cd88bc5c51e99a0e53d99c6ff2aeaf3c61cb812d5898d7e1dd80d +size 113308931 diff --git a/4b284b1b9oscar/global_step80108/layer_27-model_00-model_states.pt b/4b284b1b9oscar/global_step80108/layer_27-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5a4efa2fea19c680a00eea1a7568a8474ce5aec4 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/layer_27-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bfce39d8e900e954da508fc828def3b10b0faced8e4a604850ccb6888208687d +size 113308931 diff --git a/4b284b1b9oscar/global_step80108/layer_27-model_01-model_states.pt b/4b284b1b9oscar/global_step80108/layer_27-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d8f752f21f8f54290bb56287fcf4877184652fd5 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/layer_27-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b74a963280401a183657d2c6b394f9ff7495a590a60aab76c6ad08cf9d9097a +size 113308931 diff --git a/4b284b1b9oscar/global_step80108/layer_28-model_00-model_states.pt b/4b284b1b9oscar/global_step80108/layer_28-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4cb3da61e3dbdf8eb701299fc3acf7796f10e1b7 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/layer_28-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02c64b8bb64a057e1d99941d3e3db452dc4ced2e7125ff0810e5a84f1e6055d6 +size 113308931 diff --git a/4b284b1b9oscar/global_step80108/layer_28-model_01-model_states.pt b/4b284b1b9oscar/global_step80108/layer_28-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3ae5896f06fa25c3ba4199c73e629931c1efd73d --- /dev/null +++ b/4b284b1b9oscar/global_step80108/layer_28-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:400882a1f70074399718df40282499e859d71c45d4cf4060d76b5f6d4faf9dc7 +size 113308931 diff --git a/4b284b1b9oscar/global_step80108/layer_29-model_00-model_states.pt b/4b284b1b9oscar/global_step80108/layer_29-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7bad151c2bfe4ac25c0f42450a259d1a1d528597 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/layer_29-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10108f70b2449e33e824a05c640a75eb7e4ad213b070e364d8b7124fbb10ac78 +size 113308931 diff --git a/4b284b1b9oscar/global_step80108/layer_29-model_01-model_states.pt b/4b284b1b9oscar/global_step80108/layer_29-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5bb7fe5157cac43a3a74e20441006f3f78686b8b --- /dev/null +++ b/4b284b1b9oscar/global_step80108/layer_29-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:88ee9aab665abdba9327f1342d6c8db998162b85126951510980b7d12f7fb99e +size 113308931 diff --git a/4b284b1b9oscar/global_step80108/layer_30-model_00-model_states.pt b/4b284b1b9oscar/global_step80108/layer_30-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..54f39b9cca49ceec5357cb0ed4c5a7d9c963b5e7 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/layer_30-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2865c70a9ef9f2c33455cfde68863db74d9b6c70080e4d4c704e25c90d077389 +size 113308931 diff --git a/4b284b1b9oscar/global_step80108/layer_30-model_01-model_states.pt b/4b284b1b9oscar/global_step80108/layer_30-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b60a87c22a2082a84fb3cae68920ccef03fbf82a --- /dev/null +++ b/4b284b1b9oscar/global_step80108/layer_30-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:971652d799d7fd7ebd236d0c5a3cc25705b88a07e1e6df5b90a246c3e065bc77 +size 113308931 diff --git a/4b284b1b9oscar/global_step80108/layer_31-model_00-model_states.pt b/4b284b1b9oscar/global_step80108/layer_31-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c0c5260e42e8f2596bbd792d660103db62a62469 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/layer_31-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2fa373b360aefa21cb63e9725db7aaf373c422b56b0678789b9d3900c5715fc7 +size 113308931 diff --git a/4b284b1b9oscar/global_step80108/layer_31-model_01-model_states.pt b/4b284b1b9oscar/global_step80108/layer_31-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c7c0201f88b72bfbd13ee387fef85c7924bbf876 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/layer_31-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec135d9f87a3a945b6219303a12d5d8d93349df627b2fe46ec55cedcabbfe6fd +size 113308931 diff --git a/4b284b1b9oscar/global_step80108/layer_32-model_00-model_states.pt b/4b284b1b9oscar/global_step80108/layer_32-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2b76fa2e7afde1c1b7f9811f2f006d1e3a34c478 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/layer_32-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c0315575d30a4c35067551e9bddf26d0dfa262ec22704c1e5674510f490c2fc +size 113308931 diff --git a/4b284b1b9oscar/global_step80108/layer_32-model_01-model_states.pt b/4b284b1b9oscar/global_step80108/layer_32-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6e1c638b53f3be1306cfdb604f4295056a80694c --- /dev/null +++ b/4b284b1b9oscar/global_step80108/layer_32-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ebc830b400804a5886743d6e7bdf273e1f496c17fcb514a3ebdf150b29b72be +size 113308931 diff --git a/4b284b1b9oscar/global_step80108/layer_33-model_00-model_states.pt b/4b284b1b9oscar/global_step80108/layer_33-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..795e83cf53be66646f19cf16bfac441ca050cd05 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/layer_33-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f8f524d065b8fdf5997746de27f391cda3de2604e358db4650669c5121773066 +size 113308931 diff --git a/4b284b1b9oscar/global_step80108/layer_33-model_01-model_states.pt b/4b284b1b9oscar/global_step80108/layer_33-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ed956c1f6a4f5e2e7f72e47055e265fc0bda8e5d --- /dev/null +++ b/4b284b1b9oscar/global_step80108/layer_33-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:995f5050b8a1a8944940ca903bfa209b8f300840cdebc83272d8457529e3e858 +size 113308931 diff --git a/4b284b1b9oscar/global_step80108/layer_34-model_00-model_states.pt b/4b284b1b9oscar/global_step80108/layer_34-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1f3717db1fca71019ba0452ba65d6ad9fd87dfa3 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/layer_34-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a718d99afdd7341d8e78ca433876b2e0d12a512f1a69ed6bda8eb2f9e824e145 +size 113308931 diff --git a/4b284b1b9oscar/global_step80108/layer_34-model_01-model_states.pt b/4b284b1b9oscar/global_step80108/layer_34-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..690c201accffb5cfc0f1a0b4d7d2bd81b93a2388 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/layer_34-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce9d4a0e4dab609f1a36612fc0a7154ed21a81f453e742e46a67de4e1c4888a1 +size 113308931 diff --git a/4b284b1b9oscar/global_step80108/layer_35-model_00-model_states.pt b/4b284b1b9oscar/global_step80108/layer_35-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1b20ec4420c2e0046947423f17b726e871ef8f55 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/layer_35-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a0cc1cbf8e6e8f95aecd0f867799e3b8c0a7111f8bcf60dba14639e364f119d7 +size 113308931 diff --git a/4b284b1b9oscar/global_step80108/layer_35-model_01-model_states.pt b/4b284b1b9oscar/global_step80108/layer_35-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d78f52843a4f52711a634525489aa21345c8c7e3 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/layer_35-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d0bc18373467d70500f2f68945d29e1cae3e05edc1e0b8b2dda7db5909743e4e +size 113308931 diff --git a/4b284b1b9oscar/global_step80108/layer_36-model_00-model_states.pt b/4b284b1b9oscar/global_step80108/layer_36-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3b8908a057c9cbc2bf2ab3e9e8e3f0c7249d1299 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/layer_36-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc8fea82924b6bd21894dbcfdb833ee66eefea690dfe154e0b0101fdcd703db1 +size 113308931 diff --git a/4b284b1b9oscar/global_step80108/layer_36-model_01-model_states.pt b/4b284b1b9oscar/global_step80108/layer_36-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..49d97e10b56cc3d8e6eb52964cd4c2ab56c263c0 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/layer_36-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:441386ec5c87e065c1866c06b7d2b71ce8c94febe2f49603d365ddd7da05af65 +size 113308931 diff --git a/4b284b1b9oscar/global_step80108/layer_37-model_00-model_states.pt b/4b284b1b9oscar/global_step80108/layer_37-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..af8daa5b238e0780f792a05527c688146ba40cae --- /dev/null +++ b/4b284b1b9oscar/global_step80108/layer_37-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:afc913f305c23bbcf495f021d4641c4a42ae04d01f2288e91649afd543624a88 +size 113308931 diff --git a/4b284b1b9oscar/global_step80108/layer_37-model_01-model_states.pt b/4b284b1b9oscar/global_step80108/layer_37-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fa55d41aad06ed0a52b0961d64605109aff2b11f --- /dev/null +++ b/4b284b1b9oscar/global_step80108/layer_37-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7dc244d5d6a9d0c5d37d94a76f052fb6219d930f007394752f33029ab849c48 +size 113308931 diff --git a/4b284b1b9oscar/global_step80108/layer_38-model_00-model_states.pt b/4b284b1b9oscar/global_step80108/layer_38-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7cd63e2613c8eaab0263a26b1585cbaa7a71acf0 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/layer_38-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f8c30f7153ceab0f0e851372812d28cb8647e9677b4b0437ab44584ae65b9559 +size 113308931 diff --git a/4b284b1b9oscar/global_step80108/layer_38-model_01-model_states.pt b/4b284b1b9oscar/global_step80108/layer_38-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5839362d593188979a92281a98f53ea28e8c2c3c --- /dev/null +++ b/4b284b1b9oscar/global_step80108/layer_38-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:728f901f82c8415676144580c799d57727dc17aa1adb53d4c97e8ced8522e4da +size 113308931 diff --git a/4b284b1b9oscar/global_step80108/layer_40-model_00-model_states.pt b/4b284b1b9oscar/global_step80108/layer_40-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..68e7aa69b2c1724135f927b2782323eb26db0ec2 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/layer_40-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0bea4758ec3f1fb28eccf6191465dac30a922fe79790475dd1df423078660de9 +size 13507 diff --git a/4b284b1b9oscar/global_step80108/layer_40-model_01-model_states.pt b/4b284b1b9oscar/global_step80108/layer_40-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9fd5b3771d03321d30e92ba2896719d30d27e16a --- /dev/null +++ b/4b284b1b9oscar/global_step80108/layer_40-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7670a2344e43ef02d67fec501b974247471d419c1caae300be429341d3ddad19 +size 13507 diff --git a/4b284b1b9oscar/global_step80108/mp_rank_00_model_states.pt b/4b284b1b9oscar/global_step80108/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3cdfe4507db1bef1ac27e6becac143df53950a7b --- /dev/null +++ b/4b284b1b9oscar/global_step80108/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:66467ec6de5546d2e6fe2d3094cf00498137e355b9207c0b87f34dc9003743b2 +size 51635 diff --git a/4b284b1b9oscar/global_step80108/mp_rank_01_model_states.pt b/4b284b1b9oscar/global_step80108/mp_rank_01_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..199886992e8f4cf51eaa557d7c4706ef2efc9a33 --- /dev/null +++ b/4b284b1b9oscar/global_step80108/mp_rank_01_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb4e72e2593a7ec7813814c8075f0d78a60a4497f04c6f8cd35cbc04dca399ad +size 51635 diff --git a/4b284b1b9oscar/transformers/config.json b/4b284b1b9oscar/transformers/config.json new file mode 100644 index 0000000000000000000000000000000000000000..df814c3a71ee49044410636b5eeb4f43611690ba --- /dev/null +++ b/4b284b1b9oscar/transformers/config.json @@ -0,0 +1 @@ +{"vocab_size": 50432, "n_positions": 2048, "n_embd": 3072, "n_layer": 36, "n_head": 24, "n_inner": 12288, "activation_function": "gelu", "resid_pdrop": 0.1, "embd_pdrop": 0.1, "attn_pdrop": 0.1, "layer_norm_epsilon": 1e-05, "initializer_range": 0.02, "summary_type": "cls_index", "summary_use_proj": true, "summary_activation": null, "summary_first_dropout": 0.1, "summary_proj_to_labels": true, "scale_attn_weights": true, "use_cache": true, "scale_attn_by_inverse_layer_idx": false, "reorder_and_upcast_attn": false, "bos_token_id": 50256, "eos_token_id": 50256, "return_dict": true, "output_hidden_states": false, "output_attentions": false, "torchscript": false, "torch_dtype": null, "use_bfloat16": false, "tf_legacy_loss": false, "pruned_heads": {}, "tie_word_embeddings": true, "is_encoder_decoder": false, "is_decoder": false, "cross_attention_hidden_size": null, "add_cross_attention": false, "tie_encoder_decoder": false, "max_length": 20, "min_length": 0, "do_sample": false, "early_stopping": false, "num_beams": 1, "num_beam_groups": 1, "diversity_penalty": 0.0, "temperature": 1.0, "top_k": 50, "top_p": 1.0, "typical_p": 1.0, "repetition_penalty": 1.0, "length_penalty": 1.0, "no_repeat_ngram_size": 0, "encoder_no_repeat_ngram_size": 0, "bad_words_ids": null, "num_return_sequences": 1, "chunk_size_feed_forward": 0, "output_scores": false, "return_dict_in_generate": false, "forced_bos_token_id": null, "forced_eos_token_id": null, "remove_invalid_values": false, "exponential_decay_length_penalty": null, "suppress_tokens": null, "begin_suppress_tokens": null, "architectures": ["GPT2LMHeadModel"], "finetuning_task": null, "id2label": {"0": "LABEL_0", "1": "LABEL_1"}, "label2id": {"LABEL_0": 0, "LABEL_1": 1}, "tokenizer_class": null, "prefix": null, "pad_token_id": null, "sep_token_id": null, "decoder_start_token_id": null, "task_specific_params": null, "problem_type": null, "_name_or_path": "", "transformers_version": "4.25.0.dev0", "n_ctx": 1024, "gradient_checkpointing": false, "model_type": "gpt2"} \ No newline at end of file diff --git a/4b284b1b9oscar/transformers/pytorch_model.bin b/4b284b1b9oscar/transformers/pytorch_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..6cdd56ff9588acea7ef0f70f8cd2dda5cf6a4e7f --- /dev/null +++ b/4b284b1b9oscar/transformers/pytorch_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cbb2d3dbc9fc4c95344f4d9ea448453eb9f369da89e985a28d26bede26e6e2a7 +size 8781203669 diff --git a/4b284b6boscar/evaluation/generation/agg.4b284b6boscar_GEM-web_nlg_en_PALM_prompt_0.json b/4b284b6boscar/evaluation/generation/agg.4b284b6boscar_GEM-web_nlg_en_PALM_prompt_0.json new file mode 100644 index 0000000000000000000000000000000000000000..71438558d96aa8e29a5d36db26ec98bd827c4c87 --- /dev/null +++ b/4b284b6boscar/evaluation/generation/agg.4b284b6boscar_GEM-web_nlg_en_PALM_prompt_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.36519721260505666, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.025416271815881648}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.0844897373726688, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0033773725125629405}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.23505539103583917, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004740597986047636}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.09543970962631343, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0022861713036904717}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.03592938600180986, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.00210536271605171}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.10454144700558925, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002991020929264074}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.041333131309197434, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0013620781060247143}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.07802708042033951, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0031165021391665213}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.22121439829830997, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004485457598638524}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.08838912443491174, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.002036320437905252}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.07911969436604507, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.003179215199169328}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.22011099433358053, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.00444184711183466}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.08923543208494557, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002110955534608439}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-repetitions/4b284b6boscar/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6boscar/evaluation/generation/agg.4b284b6boscar_GEM-web_nlg_en_PALM_prompt_1.json b/4b284b6boscar/evaluation/generation/agg.4b284b6boscar_GEM-web_nlg_en_PALM_prompt_1.json new file mode 100644 index 0000000000000000000000000000000000000000..fd99283e039ce22a49cd31a1e68507f774216cd3 --- /dev/null +++ b/4b284b6boscar/evaluation/generation/agg.4b284b6boscar_GEM-web_nlg_en_PALM_prompt_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.5519911539819539, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.033751880183173925}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.12331067244684876, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.004082368422597041}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.31067053294857805, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.005182304056477733}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.14277887519027355, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0033087097604432773}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.05879868858584044, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0025734193041066717}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.1541442248192973, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.003625807681257247}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.0689826995733388, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0021268339152713998}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.10996896485273867, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0036089432128995863}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.28822355849070946, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004809494638384607}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.128307323996298, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.00282945845782325}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.11297536382690374, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.003702439687681051}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.2915639206677481, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.00481999513451822}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.13128489500860036, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002907234369940614}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-repetitions/4b284b6boscar/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6boscar/evaluation/generation/agg.4b284b6boscar_GEM-web_nlg_en_PALM_prompt_2.json b/4b284b6boscar/evaluation/generation/agg.4b284b6boscar_GEM-web_nlg_en_PALM_prompt_2.json new file mode 100644 index 0000000000000000000000000000000000000000..231e77f525d9ddffde9bc1146f5171f93a492a4b --- /dev/null +++ b/4b284b6boscar/evaluation/generation/agg.4b284b6boscar_GEM-web_nlg_en_PALM_prompt_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.6339259316631447, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.03754173222757458}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.14667562622284316, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.004546019252257184}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.33761348515048895, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.005110492360257298}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.168229929968101, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0038502408432064105}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.07392396630393584, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.002910921521885995}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.17359484868950906, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.003808651746140846}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.08528944755820256, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0026434056022395106}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.1288399060647976, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.003895576855972721}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.3103792864337978, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004711801576435388}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.1496329946991757, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.003280688171307162}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.13322165186378207, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.004047868682932482}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.3159788458391283, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004761168810006645}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.15396679917311523, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.003394295596411652}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-repetitions/4b284b6boscar/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6boscar/evaluation/generation/agg.4b284b6boscar_GEM-web_nlg_en_PALM_prompt_3.json b/4b284b6boscar/evaluation/generation/agg.4b284b6boscar_GEM-web_nlg_en_PALM_prompt_3.json new file mode 100644 index 0000000000000000000000000000000000000000..0b7c0943e0a97a2e378cc326cd812ef764da1c40 --- /dev/null +++ b/4b284b6boscar/evaluation/generation/agg.4b284b6boscar_GEM-web_nlg_en_PALM_prompt_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.6987186814977953, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.03726726363431578}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.15628268534165624, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.004738048768606994}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.34564779827066666, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.005157301361583559}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.1772674836694056, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.004003003892382963}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.08018351827536892, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0030318772722181717}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.17720834755097986, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.003776236033479815}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.08972265881218434, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.00261456940628482}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.13619096966611585, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.004034691857613383}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.3156533014362113, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004683382698871321}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.15629910293144808, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.003369049215518736}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.14106938481373726, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.004197327906695634}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.3213841281008155, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004741735159952386}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.16095302857465682, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0034922988800979277}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-repetitions/4b284b6boscar/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6boscar/evaluation/generation/agg.4b284b6boscar_GEM-web_nlg_en_PALM_prompt_4.json b/4b284b6boscar/evaluation/generation/agg.4b284b6boscar_GEM-web_nlg_en_PALM_prompt_4.json new file mode 100644 index 0000000000000000000000000000000000000000..a11f058c5a551e7cfea745cd441dd615942e09d1 --- /dev/null +++ b/4b284b6boscar/evaluation/generation/agg.4b284b6boscar_GEM-web_nlg_en_PALM_prompt_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.8132044575049523, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.04307840489572349}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.16347759704430803, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.004695561092843388}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.35695621876500805, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.005056764211988934}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.18550929394489915, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.003990007962496953}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.0858985723582815, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.003113033333072909}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.18657518824555228, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.003776015761108268}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.0960354351793, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0026996759143921977}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.14325359283567762, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0040366290353170565}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.3256089247902154, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004566067865026425}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.1644313361150259, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.003403269316136382}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.15000521793249683, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.004250104475550225}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.3336933733374621, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004658361144305201}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.170863611717608, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0035686647188022296}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-repetitions/4b284b6boscar/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6boscar/evaluation/generation/agg.4b284b6boscar_GEM-web_nlg_en_PALM_prompt_5.json b/4b284b6boscar/evaluation/generation/agg.4b284b6boscar_GEM-web_nlg_en_PALM_prompt_5.json new file mode 100644 index 0000000000000000000000000000000000000000..558fbbdc28bd24f65bf4edb3519bb43f00e2636c --- /dev/null +++ b/4b284b6boscar/evaluation/generation/agg.4b284b6boscar_GEM-web_nlg_en_PALM_prompt_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.8670271385825886, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.038538862378515414}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.1746489304105952, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.004927634414508578}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.3570929599577129, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.00510044731414704}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.19328046067966642, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.004083786207840732}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.0924457972411747, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.003250827483560766}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.18760801056883655, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0037583338280536365}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.10069138588522752, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.002733147395415775}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.15182781815285762, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.004212740165200758}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.3245349442455857, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004655183104315666}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.1700662023680743, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0034658127030782362}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.15860186322431297, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.004433084191627986}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.33239822166212296, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004736491841462652}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.17643940357846452, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0036208712156513504}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-repetitions/4b284b6boscar/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6boscar/evaluation/generation/agg.4b284b6boscar_GEM-wiki_lingua_en_tldr_en_0.json b/4b284b6boscar/evaluation/generation/agg.4b284b6boscar_GEM-wiki_lingua_en_tldr_en_0.json new file mode 100644 index 0000000000000000000000000000000000000000..a69e5f3571fb8e28bf0358f20be50ac562b97336 --- /dev/null +++ b/4b284b6boscar/evaluation/generation/agg.4b284b6boscar_GEM-wiki_lingua_en_tldr_en_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.16375388077824185, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.002786961439555472}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.23310439134422403, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.003221909660619021}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.17320949923781243, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002378543620701129}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.037266624556334636, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0010454923920460784}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.055875994550861, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0015220664383122282}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.04061809653735023, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.00102349832826798}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.12625756972987834, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.00222128685798661}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.18307142060592155, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002551731495842583}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.1331660737775357, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0017286047933073323}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.1540530758011259, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0026719075792983353}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.2189816298141472, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0030502375778628647}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.1625224304576826, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002244458298481143}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 2.7351635777602485, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.07279508876749892}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-repetitions/4b284b6boscar/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6boscar/evaluation/generation/agg.4b284b6boscar_GEM-wiki_lingua_en_tldr_en_1.json b/4b284b6boscar/evaluation/generation/agg.4b284b6boscar_GEM-wiki_lingua_en_tldr_en_1.json new file mode 100644 index 0000000000000000000000000000000000000000..87d0c7438d181761772c0302e501d0c396a06360 --- /dev/null +++ b/4b284b6boscar/evaluation/generation/agg.4b284b6boscar_GEM-wiki_lingua_en_tldr_en_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.15123352006056198, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0024770673760679054}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.16716913934962777, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0026348428468133418}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.1373767191820474, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0018611394817887653}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.02431061845270688, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0011837421322610725}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.028272726146180985, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0012762421213196886}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.02159662859311345, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0008580677013526128}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.11746495228060996, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.002010782143494058}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.12901316733192114, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0020475246892545985}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.10528556398811369, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.001369577875772531}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.14415394863180697, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0023568768994817993}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.15910651619208108, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0024820476138855316}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.13070955427136605, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0017418060665744168}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 1.5561631327305139, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.10739388531682377}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-repetitions/4b284b6boscar/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6boscar/evaluation/generation/agg.4b284b6boscar_GEM-wiki_lingua_en_tldr_en_2.json b/4b284b6boscar/evaluation/generation/agg.4b284b6boscar_GEM-wiki_lingua_en_tldr_en_2.json new file mode 100644 index 0000000000000000000000000000000000000000..b30942f145dcfbbc7eb55d74f4510ddf05145c1c --- /dev/null +++ b/4b284b6boscar/evaluation/generation/agg.4b284b6boscar_GEM-wiki_lingua_en_tldr_en_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.22357648926183488, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.003403496745004805}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.23108898978062387, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0030992082209375404}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.192430862820694, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002247003523313584}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.05797035629216586, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0019885419913011878}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.05603656429890668, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0015489521328666466}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.04630531032723199, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.001181587468860551}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.17191667887153705, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.002828831061851297}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.17481639425872558, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.00239216857453571}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.14514841535686332, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0016966632675560788}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.21113970538486854, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.003241662223820054}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.2176159104822485, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0029107305579356567}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.18120773649298935, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002105112894775109}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 2.9166281994554626, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.10032940921674821}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-repetitions/4b284b6boscar/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6boscar/evaluation/generation/agg.4b284b6boscar_GEM-wiki_lingua_en_tldr_en_3.json b/4b284b6boscar/evaluation/generation/agg.4b284b6boscar_GEM-wiki_lingua_en_tldr_en_3.json new file mode 100644 index 0000000000000000000000000000000000000000..bf138f9c0cffb7f5a51bbafb7c04be6535a8cec9 --- /dev/null +++ b/4b284b6boscar/evaluation/generation/agg.4b284b6boscar_GEM-wiki_lingua_en_tldr_en_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.22569902995445462, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0038809742804849726}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.2086225275591831, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.003315098779166745}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.180670243747566, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.00257608420712232}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.06416547038499339, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.002252696014479526}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.05497059771205241, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0015764253563869673}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.04738710642101166, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0012700610973697954}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.1753927608616659, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.003290552112282621}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.1568733502695627, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0025476820762455315}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.1360067434991587, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.001953782240535597}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.21377973674170142, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.003735318958801609}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.19665901832256616, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0031297483130912885}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.1702338547406735, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0024243380669135895}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 2.779506277921281, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.12229466738338372}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-repetitions/4b284b6boscar/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6boscar/evaluation/generation/agg.4b284b6boscar_GEM-wiki_lingua_en_tldr_en_4.json b/4b284b6boscar/evaluation/generation/agg.4b284b6boscar_GEM-wiki_lingua_en_tldr_en_4.json new file mode 100644 index 0000000000000000000000000000000000000000..535deb95656f11d5717f4b567a41ab07b443e0ca --- /dev/null +++ b/4b284b6boscar/evaluation/generation/agg.4b284b6boscar_GEM-wiki_lingua_en_tldr_en_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.08172885429788375, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0031593114449411995}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.06880607657481164, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0025890657802543843}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.06135106282233744, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002155687684091724}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.02333833752926271, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0015030616397154965}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.018396239255635764, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.001045632678195372}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.016306136251979797, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0008516499355170893}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.06522015073123037, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0026414107544845554}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.053199755807901684, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002028938653804975}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.047481918108786006, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.001679846765086699}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.07691174733451789, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0030091759153711927}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.06407113817992571, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002407483027587739}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.05722336037021286, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002006378468825137}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 0.14389085369232565, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.018449228139014652}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-repetitions/4b284b6boscar/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6boscar/evaluation/generation/agg.4b284b6boscar_GEM-wiki_lingua_en_tldr_en_5.json b/4b284b6boscar/evaluation/generation/agg.4b284b6boscar_GEM-wiki_lingua_en_tldr_en_5.json new file mode 100644 index 0000000000000000000000000000000000000000..e9477b6024c3c1bb4b9ecec53b264d605d147977 --- /dev/null +++ b/4b284b6boscar/evaluation/generation/agg.4b284b6boscar_GEM-wiki_lingua_en_tldr_en_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.012848959719309508, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0013119884844163163}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.010311420129546226, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0010848349785527766}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.009463053541826822, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0009145339358699636}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.00383713070490352, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.000679000049070121}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.002691389750432684, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.00039328749507485294}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.0024767980328090607, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.00033878203552135646}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.010677492926423284, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0011412324336550364}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.008217313076562338, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0008636920884600956}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.007623920574636888, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.00074262701496866}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.012210240397913602, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0012594872826179838}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.00974458097545787, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.001023511123119965}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.0089451879827669, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0008630902539268249}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 6.788927091230416e-13, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 5.3190288411298046e-12}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-repetitions/4b284b6boscar/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6boscar/evaluation/generation/agg.4b284b6boscar_e2e_nlg_cleaned_generate_text_restaurant_0.json b/4b284b6boscar/evaluation/generation/agg.4b284b6boscar_e2e_nlg_cleaned_generate_text_restaurant_0.json new file mode 100644 index 0000000000000000000000000000000000000000..13f3d3cace92679a27d60276ee1179c9e0484b96 --- /dev/null +++ b/4b284b6boscar/evaluation/generation/agg.4b284b6boscar_e2e_nlg_cleaned_generate_text_restaurant_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 0.15232871634896603, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.020812270261486823}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.01770379177388514, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0007712828154957143}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.028491661886720938, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0010891578916398857}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.020954271163547446, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0007980489867592098}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.002501895673880381, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.00042732541832556033}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.0034077667682669804, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0005511526902650941}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.00255026898454171, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0003936972479245331}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.01712932032724213, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0007023823982565856}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.027450404231693933, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0009294384582174001}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.020230168243995296, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0006931916013766407}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.01715807340633443, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0007495810339305068}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.027584765389295527, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.001051599270290686}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.020282346611517486, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.000767526686930157}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-repetitions/4b284b6boscar/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6boscar/evaluation/generation/agg.4b284b6boscar_e2e_nlg_cleaned_generate_text_restaurant_1.json b/4b284b6boscar/evaluation/generation/agg.4b284b6boscar_e2e_nlg_cleaned_generate_text_restaurant_1.json new file mode 100644 index 0000000000000000000000000000000000000000..cd5067220b8a5ff67a16bf8c18ccec4d1944f1b9 --- /dev/null +++ b/4b284b6boscar/evaluation/generation/agg.4b284b6boscar_e2e_nlg_cleaned_generate_text_restaurant_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 11.955740880134837, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.15642139786964473}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.5523543366276142, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0032273194133200615}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.42797708934193157, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0030241470346410635}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.4567598668167415, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0023932905161546223}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.2643215040772804, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0026722105312840154}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.20215308199057408, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0022121806698831336}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.21585820859060773, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0020692552291630066}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.40750234018593817, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.002971833950463029}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.3125157249212724, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0025035354662693373}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.3344463176631742, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0021371990381405573}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.45652280658634536, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0031709106886728365}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.3523732297311478, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002796550103045126}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.37643903958132885, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0023685867771283033}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-repetitions/4b284b6boscar/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6boscar/evaluation/generation/agg.4b284b6boscar_e2e_nlg_cleaned_generate_text_restaurant_2.json b/4b284b6boscar/evaluation/generation/agg.4b284b6boscar_e2e_nlg_cleaned_generate_text_restaurant_2.json new file mode 100644 index 0000000000000000000000000000000000000000..37ab54dfd8e7956b6b686042b6e8c4b2d23277f9 --- /dev/null +++ b/4b284b6boscar/evaluation/generation/agg.4b284b6boscar_e2e_nlg_cleaned_generate_text_restaurant_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 13.897352692245587, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.14980000038720503}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.561794916535469, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.003099458635885747}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.4567589519097586, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0030026914172325615}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.4802344330712051, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002320930303516199}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.2792219908408161, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.002614017045402319}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.22598550083511856, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002301745671244508}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.2367775628405086, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0020846614978106194}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.4125697759457242, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0028156824620878228}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.3342012776517918, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0025457481527686697}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.351524532586077, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.002116811888824175}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.4679766836272037, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.003077550404036877}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.37978796737629206, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002832179161262596}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.39951857535439594, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0023615361382931218}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-repetitions/4b284b6boscar/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6boscar/evaluation/generation/agg.4b284b6boscar_e2e_nlg_cleaned_generate_text_restaurant_3.json b/4b284b6boscar/evaluation/generation/agg.4b284b6boscar_e2e_nlg_cleaned_generate_text_restaurant_3.json new file mode 100644 index 0000000000000000000000000000000000000000..5a5eec3818aedc0bc83d0e58c2f76e1bd8f66444 --- /dev/null +++ b/4b284b6boscar/evaluation/generation/agg.4b284b6boscar_e2e_nlg_cleaned_generate_text_restaurant_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 14.426686249425238, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.07922124112239044}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.5680260430312276, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0030913554764194547}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.46062214346005564, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002938192474222987}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.48630114866568, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0022963886540455164}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.2861172769387419, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.002690477373583243}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.2310837031392793, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0023655149673605107}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.24302456733362562, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0021567426223923106}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.41780470464632935, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.00284479912148554}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.3380514128610829, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002554824733679187}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.35690884478009743, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0021650316694958355}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.47406884298114293, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.003048747619228675}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.3848877688500459, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002821475089819001}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.4059984680960094, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0023597610029612243}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-repetitions/4b284b6boscar/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6boscar/evaluation/generation/agg.4b284b6boscar_e2e_nlg_cleaned_generate_text_restaurant_4.json b/4b284b6boscar/evaluation/generation/agg.4b284b6boscar_e2e_nlg_cleaned_generate_text_restaurant_4.json new file mode 100644 index 0000000000000000000000000000000000000000..659d86e9491d09d1d318aba764f1409633bf3ebd --- /dev/null +++ b/4b284b6boscar/evaluation/generation/agg.4b284b6boscar_e2e_nlg_cleaned_generate_text_restaurant_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 14.2425385270368, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.12070465932038754}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.5674339183550579, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0031765208159065333}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.45589676217731373, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0028927956512816914}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.48405302137560413, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0023511056226272723}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.28512193921853746, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0027192588682938886}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.22748223092470107, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002317019903101863}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.24122038943708105, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.002185560838559176}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.41854952516509386, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0028845475934422132}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.3354088230242437, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0025175251927694814}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.35621729860823614, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.00219679008764647}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.4751881399496292, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.003113603195689234}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.3821462060193808, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002793602104629368}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.405571228031194, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002421046900033825}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-repetitions/4b284b6boscar/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6boscar/evaluation/generation/agg.4b284b6boscar_e2e_nlg_cleaned_generate_text_restaurant_5.json b/4b284b6boscar/evaluation/generation/agg.4b284b6boscar_e2e_nlg_cleaned_generate_text_restaurant_5.json new file mode 100644 index 0000000000000000000000000000000000000000..3582699d469a09ca702efea5d2458721f58db113 --- /dev/null +++ b/4b284b6boscar/evaluation/generation/agg.4b284b6boscar_e2e_nlg_cleaned_generate_text_restaurant_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 14.361008320584343, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.1560368843029399}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.5690777901256877, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0032322208735574096}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.45484384858111365, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002842522185270529}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.48445698386739383, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002342258145013874}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.28959806457707354, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.002772700376334683}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.2287344578632653, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0022822820197528288}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.243596769826614, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.002164197721918074}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.4222734045194765, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.002886687722686102}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.3365984183167644, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002444470426579007}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.3585342364636756, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0021296678714575203}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.47857494456631217, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0031621123336196618}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.38225762195387136, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0027342556691813064}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.4072114109794734, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0023913662984892826}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-repetitions/4b284b6boscar/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6boscar/evaluation/generation/agg.4b284b6boscar_gem_xsum_article_DOC_summary_0.json b/4b284b6boscar/evaluation/generation/agg.4b284b6boscar_gem_xsum_article_DOC_summary_0.json new file mode 100644 index 0000000000000000000000000000000000000000..221c448b9615d7b6d6b450abde01b25aa03f9db8 --- /dev/null +++ b/4b284b6boscar/evaluation/generation/agg.4b284b6boscar_gem_xsum_article_DOC_summary_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.14683911932801988, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0024209614448014935}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.33232051267525825, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004965206416592606}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.1994811520035836, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002984688412674603}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.0347877835737417, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0011768705530675132}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.08224966786374009, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0027934031626812928}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.04812859174134576, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.001607211256469432}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.10790546336960771, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0018864163308328482}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.2448853816068894, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0038264085032181728}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.146380284799072, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0022388632798941263}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.1169016398885232, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.002030057097593571}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.2661904377997672, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004231721336986767}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.1589223000999379, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002474373290963512}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 1.9735502840922572, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.07275406618552088}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-repetitions/4b284b6boscar/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6boscar/evaluation/generation/agg.4b284b6boscar_gem_xsum_article_DOC_summary_1.json b/4b284b6boscar/evaluation/generation/agg.4b284b6boscar_gem_xsum_article_DOC_summary_1.json new file mode 100644 index 0000000000000000000000000000000000000000..cd49235ba26de29f10c9b7c0b192de1ab2535f3a --- /dev/null +++ b/4b284b6boscar/evaluation/generation/agg.4b284b6boscar_gem_xsum_article_DOC_summary_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.1587565929424201, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.002734028004150954}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.2839429315342853, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004504901492577771}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.19188402550566547, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002827706721355569}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.029846851134275015, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0013392701936661123}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.0574725840470226, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.00246069245408357}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.03709731053424962, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0015618279370815137}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.1181498323911531, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.002030579033137931}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.2124355930003259, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.003465890162302496}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.14286744054243364, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0021068352185527133}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.12248206747333056, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0020938304134755963}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.22210978407966295, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.00378568398661764}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.1487243376167721, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0022534985476107437}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 1.638300206290867, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.07822743390841481}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-repetitions/4b284b6boscar/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6boscar/evaluation/generation/agg.4b284b6boscar_gem_xsum_article_DOC_summary_2.json b/4b284b6boscar/evaluation/generation/agg.4b284b6boscar_gem_xsum_article_DOC_summary_2.json new file mode 100644 index 0000000000000000000000000000000000000000..d6447fa67d8ea0d71a46c97cea6afb0f400f1146 --- /dev/null +++ b/4b284b6boscar/evaluation/generation/agg.4b284b6boscar_gem_xsum_article_DOC_summary_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.17315356567023985, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0032567814817309163}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.28736976708095296, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004257004996623704}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.20016621421606, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0029081034648420524}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.03675600130879838, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0018004136622862172}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.061344714470415035, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0025169166680391974}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.04221291192859074, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0017897129758792792}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.13304195544493516, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0025505916245897793}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.22240633657661427, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0033618144117980413}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.15402918525247972, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.002267194194181029}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.13553932746039002, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.002600318961574337}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.22810281420861347, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0036392464751532154}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.15727848493672736, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002372060789387804}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 1.8180132235300948, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.10800461107815497}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-repetitions/4b284b6boscar/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6boscar/evaluation/generation/agg.4b284b6boscar_gem_xsum_article_DOC_summary_3.json b/4b284b6boscar/evaluation/generation/agg.4b284b6boscar_gem_xsum_article_DOC_summary_3.json new file mode 100644 index 0000000000000000000000000000000000000000..2ffabe011e23c07af5db432aac3e46c32337860a --- /dev/null +++ b/4b284b6boscar/evaluation/generation/agg.4b284b6boscar_gem_xsum_article_DOC_summary_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.17229167511698984, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0035468885296608124}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.2727682959834323, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004455577411908}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.19568743419032586, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0032421572082825824}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.03640068625403459, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.00180003629009263}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.05714643040549625, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002391106418603193}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.040818146352504275, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.001758412694246694}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.12934549628784311, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0026499682938759214}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.2079367842088016, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.003506259792687054}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.14751313359534127, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.002427984258029977}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.13258510136274942, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0026954493602500585}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.21466898986359226, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.003760210367462346}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.15176201376572815, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002540088784293334}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 1.8375265128691776, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.11380329430209277}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-repetitions/4b284b6boscar/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6boscar/evaluation/generation/agg.4b284b6boscar_gem_xsum_article_DOC_summary_4.json b/4b284b6boscar/evaluation/generation/agg.4b284b6boscar_gem_xsum_article_DOC_summary_4.json new file mode 100644 index 0000000000000000000000000000000000000000..b8c0eb10a5ddb0674d130401f1eab4454c3ac8ee --- /dev/null +++ b/4b284b6boscar/evaluation/generation/agg.4b284b6boscar_gem_xsum_article_DOC_summary_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.049854157064987935, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0030861147190811536}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.06666637829573964, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.003951494050861984}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.050905820351251574, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002936649188749722}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.009568873692323173, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0010725443721543572}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.01374863634918288, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0014545824225490266}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.010127271795302999, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0010361348734861174}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.03859045897117773, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0024258515639221765}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.05102740916511275, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.003040146906444265}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.03882864608439493, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0022207318687529937}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.039682572877387905, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0025137153001535515}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.05223871369062228, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.003168762214579924}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.03984498899321002, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0023064027916115458}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 0.46372311709585096, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.09429799136651668}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-repetitions/4b284b6boscar/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6boscar/evaluation/generation/agg.4b284b6boscar_gem_xsum_article_DOC_summary_5.json b/4b284b6boscar/evaluation/generation/agg.4b284b6boscar_gem_xsum_article_DOC_summary_5.json new file mode 100644 index 0000000000000000000000000000000000000000..0acda3126de33f645662d5d47a4a22ab7ab23fa3 --- /dev/null +++ b/4b284b6boscar/evaluation/generation/agg.4b284b6boscar_gem_xsum_article_DOC_summary_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.00375709923706833, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.001067372185961691}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.0027436329216451176, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0007640456916008605}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.003113321950673498, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0008689581396887578}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.0005930059273566488, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0002584437833429403}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.000410764780909065, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.00016925078259344875}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.0004798845639226407, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.00020204272629620264}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.002781684748525154, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0007911433597366938}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.002025647482597874, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0005582402498199304}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.002297229116490886, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0006358236397526091}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.0031454079965436295, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0008989173681249037}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.002308538269140517, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0006456848704500759}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.0026114688524966553, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0007315944509355694}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 1.1113865171956142e-43, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 1.4470133621020118e-34}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-repetitions/4b284b6boscar/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6boscar/evaluation/generation/examples.4b284b6boscar_GEM-web_nlg_en_PALM_prompt_0.jsonl b/4b284b6boscar/evaluation/generation/examples.4b284b6boscar_GEM-web_nlg_en_PALM_prompt_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..ab1b50df9356d84fc06e6ec1517dbece3b147fac --- /dev/null +++ b/4b284b6boscar/evaluation/generation/examples.4b284b6boscar_GEM-web_nlg_en_PALM_prompt_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a6bded556e5313eb65ddfec05423a7c30591dea5929601886230ee49a0299b5 +size 3872623 diff --git a/4b284b6boscar/evaluation/generation/examples.4b284b6boscar_GEM-web_nlg_en_PALM_prompt_1.jsonl b/4b284b6boscar/evaluation/generation/examples.4b284b6boscar_GEM-web_nlg_en_PALM_prompt_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..1cc3add246aba1abb98b6c958669b867553979d9 --- /dev/null +++ b/4b284b6boscar/evaluation/generation/examples.4b284b6boscar_GEM-web_nlg_en_PALM_prompt_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:53aa6f779ddbdd796d79418bb42eeb68e4fefa4dd7289d2de6503e08d31a0842 +size 4764844 diff --git a/4b284b6boscar/evaluation/generation/examples.4b284b6boscar_GEM-web_nlg_en_PALM_prompt_2.jsonl b/4b284b6boscar/evaluation/generation/examples.4b284b6boscar_GEM-web_nlg_en_PALM_prompt_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..2ae9dbf20cb24635767db15f1f5c6671a8f2a78f --- /dev/null +++ b/4b284b6boscar/evaluation/generation/examples.4b284b6boscar_GEM-web_nlg_en_PALM_prompt_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ec509a1e6430f4baf2901e6d29fe60aef885133d985c2ac5b0b3ea91785f6ff +size 5623198 diff --git a/4b284b6boscar/evaluation/generation/examples.4b284b6boscar_GEM-web_nlg_en_PALM_prompt_3.jsonl b/4b284b6boscar/evaluation/generation/examples.4b284b6boscar_GEM-web_nlg_en_PALM_prompt_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..86bb9a6c035c35ac5dc369ae411aa812b99b71b8 --- /dev/null +++ b/4b284b6boscar/evaluation/generation/examples.4b284b6boscar_GEM-web_nlg_en_PALM_prompt_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:520fcbd89156c6ebe43a5d36fb459b1f2f87edf2e597fb5442f9084dcb6492b7 +size 6504098 diff --git a/4b284b6boscar/evaluation/generation/examples.4b284b6boscar_GEM-web_nlg_en_PALM_prompt_4.jsonl b/4b284b6boscar/evaluation/generation/examples.4b284b6boscar_GEM-web_nlg_en_PALM_prompt_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..6db03a006c6454caf2f462352484af9b0b8893ac --- /dev/null +++ b/4b284b6boscar/evaluation/generation/examples.4b284b6boscar_GEM-web_nlg_en_PALM_prompt_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e02e1f9e69176f1d39f0fc2f081c216d90ff6e1206ae1eb02b08a94b8d82239f +size 7383780 diff --git a/4b284b6boscar/evaluation/generation/examples.4b284b6boscar_GEM-web_nlg_en_PALM_prompt_5.jsonl b/4b284b6boscar/evaluation/generation/examples.4b284b6boscar_GEM-web_nlg_en_PALM_prompt_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..2e77fc0ffc531b13eaada206e76353038f809d6f --- /dev/null +++ b/4b284b6boscar/evaluation/generation/examples.4b284b6boscar_GEM-web_nlg_en_PALM_prompt_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9067c883b20c62591d937cc89174d245582ba36659cf46a08cb3cf300bca3587 +size 8260166 diff --git a/4b284b6boscar/evaluation/generation/examples.4b284b6boscar_GEM-wiki_lingua_en_tldr_en_0.jsonl b/4b284b6boscar/evaluation/generation/examples.4b284b6boscar_GEM-wiki_lingua_en_tldr_en_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..de610be2818e4b784ae14a0200ad7a7e2258c5ba --- /dev/null +++ b/4b284b6boscar/evaluation/generation/examples.4b284b6boscar_GEM-wiki_lingua_en_tldr_en_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:33f099f08b7866856d202d5cb51c8d83d0328d5e2ede2da68d10bee004a83eff +size 7520136 diff --git a/4b284b6boscar/evaluation/generation/examples.4b284b6boscar_GEM-wiki_lingua_en_tldr_en_1.jsonl b/4b284b6boscar/evaluation/generation/examples.4b284b6boscar_GEM-wiki_lingua_en_tldr_en_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..9015241ae1c4ecf6f7811e135d8afbb2d5ad6ca0 --- /dev/null +++ b/4b284b6boscar/evaluation/generation/examples.4b284b6boscar_GEM-wiki_lingua_en_tldr_en_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:370e9580173c0ed2984f67da5a3c293e4e2f64d804d929eb34f4dc68363a0743 +size 13073722 diff --git a/4b284b6boscar/evaluation/generation/examples.4b284b6boscar_GEM-wiki_lingua_en_tldr_en_2.jsonl b/4b284b6boscar/evaluation/generation/examples.4b284b6boscar_GEM-wiki_lingua_en_tldr_en_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..75dfa94b4bf6ab8b6a7c50cfc7d3f0be1bf3db2d --- /dev/null +++ b/4b284b6boscar/evaluation/generation/examples.4b284b6boscar_GEM-wiki_lingua_en_tldr_en_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:79cd898045403b64bde4b008673751c29af9bd27d5ace5f3433c5f0ff13d6354 +size 18665750 diff --git a/4b284b6boscar/evaluation/generation/examples.4b284b6boscar_GEM-wiki_lingua_en_tldr_en_3.jsonl b/4b284b6boscar/evaluation/generation/examples.4b284b6boscar_GEM-wiki_lingua_en_tldr_en_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..2fad0561e07fe52801aa084fbf17c969279edcd7 --- /dev/null +++ b/4b284b6boscar/evaluation/generation/examples.4b284b6boscar_GEM-wiki_lingua_en_tldr_en_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d0dd0b3c0c762f880b21549145de3fe9f9481f7937414d00c745f62d0901ca5 +size 24117513 diff --git a/4b284b6boscar/evaluation/generation/examples.4b284b6boscar_GEM-wiki_lingua_en_tldr_en_4.jsonl b/4b284b6boscar/evaluation/generation/examples.4b284b6boscar_GEM-wiki_lingua_en_tldr_en_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..5b3a59129d7583913b319f1c24d56589da93b9d1 --- /dev/null +++ b/4b284b6boscar/evaluation/generation/examples.4b284b6boscar_GEM-wiki_lingua_en_tldr_en_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d6c209f48f7e4a452d9c028f680c5d675e0e2c54f5e9ffb6b9fc30f9b50bf58e +size 29394578 diff --git a/4b284b6boscar/evaluation/generation/examples.4b284b6boscar_GEM-wiki_lingua_en_tldr_en_5.jsonl b/4b284b6boscar/evaluation/generation/examples.4b284b6boscar_GEM-wiki_lingua_en_tldr_en_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..b6ab6a852af7fb4f36d19e527e77b20cb02d7f88 --- /dev/null +++ b/4b284b6boscar/evaluation/generation/examples.4b284b6boscar_GEM-wiki_lingua_en_tldr_en_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d8c3ec356fe2d581925523cd10da329bb72ce1d91e9f99edfdd1bcadef789a34 +size 34785894 diff --git a/4b284b6boscar/evaluation/generation/examples.4b284b6boscar_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl b/4b284b6boscar/evaluation/generation/examples.4b284b6boscar_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..72d72e9d92fc25df0ad65f6c1c1db6db18440e74 --- /dev/null +++ b/4b284b6boscar/evaluation/generation/examples.4b284b6boscar_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b18aa1fc3816cc6e8232e09525f354500b277bcdd8330b0b3837d5e6cd0fdc4f +size 4490323 diff --git a/4b284b6boscar/evaluation/generation/examples.4b284b6boscar_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl b/4b284b6boscar/evaluation/generation/examples.4b284b6boscar_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..49c8dc1599ef56770b6d7a5aa6e89b779406e747 --- /dev/null +++ b/4b284b6boscar/evaluation/generation/examples.4b284b6boscar_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:561fd2239dcc71fccc5710f0abac042675104e1b3bbcced852cdd62eb76c33e6 +size 5007820 diff --git a/4b284b6boscar/evaluation/generation/examples.4b284b6boscar_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl b/4b284b6boscar/evaluation/generation/examples.4b284b6boscar_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..c844abc24389474746872274045959ebb9911ac9 --- /dev/null +++ b/4b284b6boscar/evaluation/generation/examples.4b284b6boscar_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7bf9ae627ae54f63cdb4d7cff0e7bcf1e972be28adf0a4565b0de5e89835185f +size 6101786 diff --git a/4b284b6boscar/evaluation/generation/examples.4b284b6boscar_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl b/4b284b6boscar/evaluation/generation/examples.4b284b6boscar_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..c592b7abdfa769ca5e401e87dd4fbef266320b6e --- /dev/null +++ b/4b284b6boscar/evaluation/generation/examples.4b284b6boscar_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8f3f2b1cc94d0ab309da7f30c1ec5099220c41b6437a92fc144b6291af1f705 +size 7181271 diff --git a/4b284b6boscar/evaluation/generation/examples.4b284b6boscar_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl b/4b284b6boscar/evaluation/generation/examples.4b284b6boscar_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..3f59c89918a77dfba59f00206cb1aa1680928cc3 --- /dev/null +++ b/4b284b6boscar/evaluation/generation/examples.4b284b6boscar_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b81e88e0112403f8ca9b6a3b41b8a9fd644a20a01fe1c27a217f40df42481c54 +size 8256841 diff --git a/4b284b6boscar/evaluation/generation/examples.4b284b6boscar_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl b/4b284b6boscar/evaluation/generation/examples.4b284b6boscar_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..b06ed8690671e5977605dfbfa3cd9682e9b8deda --- /dev/null +++ b/4b284b6boscar/evaluation/generation/examples.4b284b6boscar_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92fd5532e640bfc6789b3bc407c12ce579b9c6d3ba7545d16bbed50cc67955bf +size 9343185 diff --git a/4b284b6boscar/evaluation/generation/examples.4b284b6boscar_gem_xsum_article_DOC_summary_0.jsonl b/4b284b6boscar/evaluation/generation/examples.4b284b6boscar_gem_xsum_article_DOC_summary_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..088618efa33b3081049a308ec93eae90f3150bcd --- /dev/null +++ b/4b284b6boscar/evaluation/generation/examples.4b284b6boscar_gem_xsum_article_DOC_summary_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a78a64e9120b0d8df81dfc201b9ebbb0f3191cb5c7c7fdb85af86d4db3f58f63 +size 2799250 diff --git a/4b284b6boscar/evaluation/generation/examples.4b284b6boscar_gem_xsum_article_DOC_summary_1.jsonl b/4b284b6boscar/evaluation/generation/examples.4b284b6boscar_gem_xsum_article_DOC_summary_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..0a6f5d670f6194f858f5350dc44bc75f96d684ef --- /dev/null +++ b/4b284b6boscar/evaluation/generation/examples.4b284b6boscar_gem_xsum_article_DOC_summary_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f7e235468da8f0ae1233e8c936613a362fd9b2be54753d6bab2a7ae2aeefb9e +size 5032789 diff --git a/4b284b6boscar/evaluation/generation/examples.4b284b6boscar_gem_xsum_article_DOC_summary_2.jsonl b/4b284b6boscar/evaluation/generation/examples.4b284b6boscar_gem_xsum_article_DOC_summary_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..ef88b43c422fe142a8c896bd66cc59128dbf8345 --- /dev/null +++ b/4b284b6boscar/evaluation/generation/examples.4b284b6boscar_gem_xsum_article_DOC_summary_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e1f40323fabb0169dbf429944a9a5ad23df192e2e3d23977c0b443f1960efe88 +size 7297675 diff --git a/4b284b6boscar/evaluation/generation/examples.4b284b6boscar_gem_xsum_article_DOC_summary_3.jsonl b/4b284b6boscar/evaluation/generation/examples.4b284b6boscar_gem_xsum_article_DOC_summary_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..519ccb84cb2e779511162aa1c7ef5095f433130b --- /dev/null +++ b/4b284b6boscar/evaluation/generation/examples.4b284b6boscar_gem_xsum_article_DOC_summary_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cab33f29a0d7b2a74a4efbf8494c8cf7a70ac3f8ed5b79cef7523c69ae399e05 +size 9567760 diff --git a/4b284b6boscar/evaluation/generation/examples.4b284b6boscar_gem_xsum_article_DOC_summary_4.jsonl b/4b284b6boscar/evaluation/generation/examples.4b284b6boscar_gem_xsum_article_DOC_summary_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..a3146bcd168b23458e5c7403d90adaf04ffcbbef --- /dev/null +++ b/4b284b6boscar/evaluation/generation/examples.4b284b6boscar_gem_xsum_article_DOC_summary_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb815ae8ff5e8fbd46aa36b424bbadc91a40ee3fb9c0339c1f2e07926aab9e0a +size 11655151 diff --git a/4b284b6boscar/evaluation/generation/examples.4b284b6boscar_gem_xsum_article_DOC_summary_5.jsonl b/4b284b6boscar/evaluation/generation/examples.4b284b6boscar_gem_xsum_article_DOC_summary_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..d017d6aab5a234078d7fb9ec1bd6409eecfd97fb --- /dev/null +++ b/4b284b6boscar/evaluation/generation/examples.4b284b6boscar_gem_xsum_article_DOC_summary_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a05465e430b88982361ac64e8220732a70c8df862ce7e60ab4eaca94815bf06 +size 13897367 diff --git a/4b284b6boscar/evaluation/generation/merged.csv b/4b284b6boscar/evaluation/generation/merged.csv new file mode 100644 index 0000000000000000000000000000000000000000..5daf857204e61b12d80d4b1ee5b173a637c6a662 --- /dev/null +++ b/4b284b6boscar/evaluation/generation/merged.csv @@ -0,0 +1,53 @@ +dataset,fewshots,prompt,metric,value +e2e_nlg_cleaned,0,generate_text_restaurant,rouge2_fmeasure,0.00255026898454171 +e2e_nlg_cleaned,0,median,rouge2_fmeasure,0.00255026898454171 +e2e_nlg_cleaned,1,generate_text_restaurant,rouge2_fmeasure,0.21585820859060773 +e2e_nlg_cleaned,1,median,rouge2_fmeasure,0.21585820859060773 +e2e_nlg_cleaned,2,generate_text_restaurant,rouge2_fmeasure,0.2367775628405086 +e2e_nlg_cleaned,2,median,rouge2_fmeasure,0.2367775628405086 +e2e_nlg_cleaned,3,generate_text_restaurant,rouge2_fmeasure,0.24302456733362562 +e2e_nlg_cleaned,3,median,rouge2_fmeasure,0.24302456733362562 +e2e_nlg_cleaned,4,generate_text_restaurant,rouge2_fmeasure,0.24122038943708105 +e2e_nlg_cleaned,4,median,rouge2_fmeasure,0.24122038943708105 +e2e_nlg_cleaned,5,generate_text_restaurant,rouge2_fmeasure,0.243596769826614 +e2e_nlg_cleaned,5,median,rouge2_fmeasure,0.243596769826614 +e2e_nlg_cleaned,5,average,multiple,0.1971712945021631 +gem_xsum,0,article_DOC_summary,rouge2_fmeasure,0.04812859174134576 +gem_xsum,0,median,rouge2_fmeasure,0.04812859174134576 +gem_xsum,1,article_DOC_summary,rouge2_fmeasure,0.03709731053424962 +gem_xsum,1,median,rouge2_fmeasure,0.03709731053424962 +gem_xsum,2,article_DOC_summary,rouge2_fmeasure,0.04221291192859074 +gem_xsum,2,median,rouge2_fmeasure,0.04221291192859074 +gem_xsum,3,article_DOC_summary,rouge2_fmeasure,0.040818146352504275 +gem_xsum,3,median,rouge2_fmeasure,0.040818146352504275 +gem_xsum,4,article_DOC_summary,rouge2_fmeasure,0.010127271795302999 +gem_xsum,4,median,rouge2_fmeasure,0.010127271795302999 +gem_xsum,5,article_DOC_summary,rouge2_fmeasure,0.0004798845639226407 +gem_xsum,5,median,rouge2_fmeasure,0.0004798845639226407 +gem_xsum,5,average,multiple,0.02981068615265267 +web_nlg_en,0,PALM_prompt,rouge2_fmeasure,0.041333131309197434 +web_nlg_en,0,median,rouge2_fmeasure,0.041333131309197434 +web_nlg_en,1,PALM_prompt,rouge2_fmeasure,0.0689826995733388 +web_nlg_en,1,median,rouge2_fmeasure,0.0689826995733388 +web_nlg_en,2,PALM_prompt,rouge2_fmeasure,0.08528944755820256 +web_nlg_en,2,median,rouge2_fmeasure,0.08528944755820256 +web_nlg_en,3,PALM_prompt,rouge2_fmeasure,0.08972265881218434 +web_nlg_en,3,median,rouge2_fmeasure,0.08972265881218434 +web_nlg_en,4,PALM_prompt,rouge2_fmeasure,0.0960354351793 +web_nlg_en,4,median,rouge2_fmeasure,0.0960354351793 +web_nlg_en,5,PALM_prompt,rouge2_fmeasure,0.10069138588522752 +web_nlg_en,5,median,rouge2_fmeasure,0.10069138588522752 +web_nlg_en,5,average,multiple,0.08034245971957511 +wiki_lingua_en,0,tldr_en,rouge2_fmeasure,0.04061809653735023 +wiki_lingua_en,0,median,rouge2_fmeasure,0.04061809653735023 +wiki_lingua_en,1,tldr_en,rouge2_fmeasure,0.02159662859311345 +wiki_lingua_en,1,median,rouge2_fmeasure,0.02159662859311345 +wiki_lingua_en,2,tldr_en,rouge2_fmeasure,0.04630531032723199 +wiki_lingua_en,2,median,rouge2_fmeasure,0.04630531032723199 +wiki_lingua_en,3,tldr_en,rouge2_fmeasure,0.04738710642101166 +wiki_lingua_en,3,median,rouge2_fmeasure,0.04738710642101166 +wiki_lingua_en,4,tldr_en,rouge2_fmeasure,0.016306136251979797 +wiki_lingua_en,4,median,rouge2_fmeasure,0.016306136251979797 +wiki_lingua_en,5,tldr_en,rouge2_fmeasure,0.0024767980328090607 +wiki_lingua_en,5,median,rouge2_fmeasure,0.0024767980328090607 +wiki_lingua_en,5,average,multiple,0.02911501269391603 diff --git a/4b284b6boscar/evaluation/generation/merged.json b/4b284b6boscar/evaluation/generation/merged.json new file mode 100644 index 0000000000000000000000000000000000000000..48b65e02fee18537b937bd144543a4f920a48ea5 --- /dev/null +++ b/4b284b6boscar/evaluation/generation/merged.json @@ -0,0 +1 @@ +{"GEM/web_nlg_en": {"0": {"PALM_prompt": {"bleu": 0.36519721260505666, "bleu_stderr": 0.025416271815881648, "rouge1_fmeasure": 0.09543970962631343, "rouge1_fmeasure_stderr": 0.0022861713036904717, "rouge1_precision": 0.0844897373726688, "rouge1_precision_stderr": 0.0033773725125629405, "rouge1_recall": 0.23505539103583917, "rouge1_recall_stderr": 0.004740597986047636, "rouge2_fmeasure": 0.041333131309197434, "rouge2_fmeasure_stderr": 0.0013620781060247143, "rouge2_precision": 0.03592938600180986, "rouge2_precision_stderr": 0.00210536271605171, "rouge2_recall": 0.10454144700558925, "rouge2_recall_stderr": 0.002991020929264074, "rougeL_fmeasure": 0.08838912443491174, "rougeL_fmeasure_stderr": 0.002036320437905252, "rougeL_precision": 0.07802708042033951, "rougeL_precision_stderr": 0.0031165021391665213, "rougeL_recall": 0.22121439829830997, "rougeL_recall_stderr": 0.004485457598638524, "rougeLsum_fmeasure": 0.08923543208494557, "rougeLsum_fmeasure_stderr": 0.002110955534608439, "rougeLsum_precision": 0.07911969436604507, "rougeLsum_precision_stderr": 0.003179215199169328, "rougeLsum_recall": 0.22011099433358053, "rougeLsum_recall_stderr": 0.00444184711183466}}, "1": {"PALM_prompt": {"bleu": 0.5519911539819539, "bleu_stderr": 0.033751880183173925, "rouge1_fmeasure": 0.14277887519027355, "rouge1_fmeasure_stderr": 0.0033087097604432773, "rouge1_precision": 0.12331067244684876, "rouge1_precision_stderr": 0.004082368422597041, "rouge1_recall": 0.31067053294857805, "rouge1_recall_stderr": 0.005182304056477733, "rouge2_fmeasure": 0.0689826995733388, "rouge2_fmeasure_stderr": 0.0021268339152713998, "rouge2_precision": 0.05879868858584044, "rouge2_precision_stderr": 0.0025734193041066717, "rouge2_recall": 0.1541442248192973, "rouge2_recall_stderr": 0.003625807681257247, "rougeL_fmeasure": 0.128307323996298, "rougeL_fmeasure_stderr": 0.00282945845782325, "rougeL_precision": 0.10996896485273867, "rougeL_precision_stderr": 0.0036089432128995863, "rougeL_recall": 0.28822355849070946, "rougeL_recall_stderr": 0.004809494638384607, "rougeLsum_fmeasure": 0.13128489500860036, "rougeLsum_fmeasure_stderr": 0.002907234369940614, "rougeLsum_precision": 0.11297536382690374, "rougeLsum_precision_stderr": 0.003702439687681051, "rougeLsum_recall": 0.2915639206677481, "rougeLsum_recall_stderr": 0.00481999513451822}}, "2": {"PALM_prompt": {"bleu": 0.6339259316631447, "bleu_stderr": 0.03754173222757458, "rouge1_fmeasure": 0.168229929968101, "rouge1_fmeasure_stderr": 0.0038502408432064105, "rouge1_precision": 0.14667562622284316, "rouge1_precision_stderr": 0.004546019252257184, "rouge1_recall": 0.33761348515048895, "rouge1_recall_stderr": 0.005110492360257298, "rouge2_fmeasure": 0.08528944755820256, "rouge2_fmeasure_stderr": 0.0026434056022395106, "rouge2_precision": 0.07392396630393584, "rouge2_precision_stderr": 0.002910921521885995, "rouge2_recall": 0.17359484868950906, "rouge2_recall_stderr": 0.003808651746140846, "rougeL_fmeasure": 0.1496329946991757, "rougeL_fmeasure_stderr": 0.003280688171307162, "rougeL_precision": 0.1288399060647976, "rougeL_precision_stderr": 0.003895576855972721, "rougeL_recall": 0.3103792864337978, "rougeL_recall_stderr": 0.004711801576435388, "rougeLsum_fmeasure": 0.15396679917311523, "rougeLsum_fmeasure_stderr": 0.003394295596411652, "rougeLsum_precision": 0.13322165186378207, "rougeLsum_precision_stderr": 0.004047868682932482, "rougeLsum_recall": 0.3159788458391283, "rougeLsum_recall_stderr": 0.004761168810006645}}, "3": {"PALM_prompt": {"bleu": 0.6987186814977953, "bleu_stderr": 0.03726726363431578, "rouge1_fmeasure": 0.1772674836694056, "rouge1_fmeasure_stderr": 0.004003003892382963, "rouge1_precision": 0.15628268534165624, "rouge1_precision_stderr": 0.004738048768606994, "rouge1_recall": 0.34564779827066666, "rouge1_recall_stderr": 0.005157301361583559, "rouge2_fmeasure": 0.08972265881218434, "rouge2_fmeasure_stderr": 0.00261456940628482, "rouge2_precision": 0.08018351827536892, "rouge2_precision_stderr": 0.0030318772722181717, "rouge2_recall": 0.17720834755097986, "rouge2_recall_stderr": 0.003776236033479815, "rougeL_fmeasure": 0.15629910293144808, "rougeL_fmeasure_stderr": 0.003369049215518736, "rougeL_precision": 0.13619096966611585, "rougeL_precision_stderr": 0.004034691857613383, "rougeL_recall": 0.3156533014362113, "rougeL_recall_stderr": 0.004683382698871321, "rougeLsum_fmeasure": 0.16095302857465682, "rougeLsum_fmeasure_stderr": 0.0034922988800979277, "rougeLsum_precision": 0.14106938481373726, "rougeLsum_precision_stderr": 0.004197327906695634, "rougeLsum_recall": 0.3213841281008155, "rougeLsum_recall_stderr": 0.004741735159952386}}, "4": {"PALM_prompt": {"bleu": 0.8132044575049523, "bleu_stderr": 0.04307840489572349, "rouge1_fmeasure": 0.18550929394489915, "rouge1_fmeasure_stderr": 0.003990007962496953, "rouge1_precision": 0.16347759704430803, "rouge1_precision_stderr": 0.004695561092843388, "rouge1_recall": 0.35695621876500805, "rouge1_recall_stderr": 0.005056764211988934, "rouge2_fmeasure": 0.0960354351793, "rouge2_fmeasure_stderr": 0.0026996759143921977, "rouge2_precision": 0.0858985723582815, "rouge2_precision_stderr": 0.003113033333072909, "rouge2_recall": 0.18657518824555228, "rouge2_recall_stderr": 0.003776015761108268, "rougeL_fmeasure": 0.1644313361150259, "rougeL_fmeasure_stderr": 0.003403269316136382, "rougeL_precision": 0.14325359283567762, "rougeL_precision_stderr": 0.0040366290353170565, "rougeL_recall": 0.3256089247902154, "rougeL_recall_stderr": 0.004566067865026425, "rougeLsum_fmeasure": 0.170863611717608, "rougeLsum_fmeasure_stderr": 0.0035686647188022296, "rougeLsum_precision": 0.15000521793249683, "rougeLsum_precision_stderr": 0.004250104475550225, "rougeLsum_recall": 0.3336933733374621, "rougeLsum_recall_stderr": 0.004658361144305201}}, "5": {"PALM_prompt": {"bleu": 0.8670271385825886, "bleu_stderr": 0.038538862378515414, "rouge1_fmeasure": 0.19328046067966642, "rouge1_fmeasure_stderr": 0.004083786207840732, "rouge1_precision": 0.1746489304105952, "rouge1_precision_stderr": 0.004927634414508578, "rouge1_recall": 0.3570929599577129, "rouge1_recall_stderr": 0.00510044731414704, "rouge2_fmeasure": 0.10069138588522752, "rouge2_fmeasure_stderr": 0.002733147395415775, "rouge2_precision": 0.0924457972411747, "rouge2_precision_stderr": 0.003250827483560766, "rouge2_recall": 0.18760801056883655, "rouge2_recall_stderr": 0.0037583338280536365, "rougeL_fmeasure": 0.1700662023680743, "rougeL_fmeasure_stderr": 0.0034658127030782362, "rougeL_precision": 0.15182781815285762, "rougeL_precision_stderr": 0.004212740165200758, "rougeL_recall": 0.3245349442455857, "rougeL_recall_stderr": 0.004655183104315666, "rougeLsum_fmeasure": 0.17643940357846452, "rougeLsum_fmeasure_stderr": 0.0036208712156513504, "rougeLsum_precision": 0.15860186322431297, "rougeLsum_precision_stderr": 0.004433084191627986, "rougeLsum_recall": 0.33239822166212296, "rougeLsum_recall_stderr": 0.004736491841462652}}}, "GEM/wiki_lingua_en": {"0": {"tldr_en": {"bleu": 2.7351635777602485, "bleu_stderr": 0.07279508876749892, "rouge1_fmeasure": 0.17320949923781243, "rouge1_fmeasure_stderr": 0.002378543620701129, "rouge1_precision": 0.16375388077824185, "rouge1_precision_stderr": 0.002786961439555472, "rouge1_recall": 0.23310439134422403, "rouge1_recall_stderr": 0.003221909660619021, "rouge2_fmeasure": 0.04061809653735023, "rouge2_fmeasure_stderr": 0.00102349832826798, "rouge2_precision": 0.037266624556334636, "rouge2_precision_stderr": 0.0010454923920460784, "rouge2_recall": 0.055875994550861, "rouge2_recall_stderr": 0.0015220664383122282, "rougeL_fmeasure": 0.1331660737775357, "rougeL_fmeasure_stderr": 0.0017286047933073323, "rougeL_precision": 0.12625756972987834, "rougeL_precision_stderr": 0.00222128685798661, "rougeL_recall": 0.18307142060592155, "rougeL_recall_stderr": 0.002551731495842583, "rougeLsum_fmeasure": 0.1625224304576826, "rougeLsum_fmeasure_stderr": 0.002244458298481143, "rougeLsum_precision": 0.1540530758011259, "rougeLsum_precision_stderr": 0.0026719075792983353, "rougeLsum_recall": 0.2189816298141472, "rougeLsum_recall_stderr": 0.0030502375778628647}}, "1": {"tldr_en": {"bleu": 1.5561631327305139, "bleu_stderr": 0.10739388531682377, "rouge1_fmeasure": 0.1373767191820474, "rouge1_fmeasure_stderr": 0.0018611394817887653, "rouge1_precision": 0.15123352006056198, "rouge1_precision_stderr": 0.0024770673760679054, "rouge1_recall": 0.16716913934962777, "rouge1_recall_stderr": 0.0026348428468133418, "rouge2_fmeasure": 0.02159662859311345, "rouge2_fmeasure_stderr": 0.0008580677013526128, "rouge2_precision": 0.02431061845270688, "rouge2_precision_stderr": 0.0011837421322610725, "rouge2_recall": 0.028272726146180985, "rouge2_recall_stderr": 0.0012762421213196886, "rougeL_fmeasure": 0.10528556398811369, "rougeL_fmeasure_stderr": 0.001369577875772531, "rougeL_precision": 0.11746495228060996, "rougeL_precision_stderr": 0.002010782143494058, "rougeL_recall": 0.12901316733192114, "rougeL_recall_stderr": 0.0020475246892545985, "rougeLsum_fmeasure": 0.13070955427136605, "rougeLsum_fmeasure_stderr": 0.0017418060665744168, "rougeLsum_precision": 0.14415394863180697, "rougeLsum_precision_stderr": 0.0023568768994817993, "rougeLsum_recall": 0.15910651619208108, "rougeLsum_recall_stderr": 0.0024820476138855316}}, "2": {"tldr_en": {"bleu": 2.9166281994554626, "bleu_stderr": 0.10032940921674821, "rouge1_fmeasure": 0.192430862820694, "rouge1_fmeasure_stderr": 0.002247003523313584, "rouge1_precision": 0.22357648926183488, "rouge1_precision_stderr": 0.003403496745004805, "rouge1_recall": 0.23108898978062387, "rouge1_recall_stderr": 0.0030992082209375404, "rouge2_fmeasure": 0.04630531032723199, "rouge2_fmeasure_stderr": 0.001181587468860551, "rouge2_precision": 0.05797035629216586, "rouge2_precision_stderr": 0.0019885419913011878, "rouge2_recall": 0.05603656429890668, "rouge2_recall_stderr": 0.0015489521328666466, "rougeL_fmeasure": 0.14514841535686332, "rougeL_fmeasure_stderr": 0.0016966632675560788, "rougeL_precision": 0.17191667887153705, "rougeL_precision_stderr": 0.002828831061851297, "rougeL_recall": 0.17481639425872558, "rougeL_recall_stderr": 0.00239216857453571, "rougeLsum_fmeasure": 0.18120773649298935, "rougeLsum_fmeasure_stderr": 0.002105112894775109, "rougeLsum_precision": 0.21113970538486854, "rougeLsum_precision_stderr": 0.003241662223820054, "rougeLsum_recall": 0.2176159104822485, "rougeLsum_recall_stderr": 0.0029107305579356567}}, "3": {"tldr_en": {"bleu": 2.779506277921281, "bleu_stderr": 0.12229466738338372, "rouge1_fmeasure": 0.180670243747566, "rouge1_fmeasure_stderr": 0.00257608420712232, "rouge1_precision": 0.22569902995445462, "rouge1_precision_stderr": 0.0038809742804849726, "rouge1_recall": 0.2086225275591831, "rouge1_recall_stderr": 0.003315098779166745, "rouge2_fmeasure": 0.04738710642101166, "rouge2_fmeasure_stderr": 0.0012700610973697954, "rouge2_precision": 0.06416547038499339, "rouge2_precision_stderr": 0.002252696014479526, "rouge2_recall": 0.05497059771205241, "rouge2_recall_stderr": 0.0015764253563869673, "rougeL_fmeasure": 0.1360067434991587, "rougeL_fmeasure_stderr": 0.001953782240535597, "rougeL_precision": 0.1753927608616659, "rougeL_precision_stderr": 0.003290552112282621, "rougeL_recall": 0.1568733502695627, "rougeL_recall_stderr": 0.0025476820762455315, "rougeLsum_fmeasure": 0.1702338547406735, "rougeLsum_fmeasure_stderr": 0.0024243380669135895, "rougeLsum_precision": 0.21377973674170142, "rougeLsum_precision_stderr": 0.003735318958801609, "rougeLsum_recall": 0.19665901832256616, "rougeLsum_recall_stderr": 0.0031297483130912885}}, "4": {"tldr_en": {"bleu": 0.14389085369232565, "bleu_stderr": 0.018449228139014652, "rouge1_fmeasure": 0.06135106282233744, "rouge1_fmeasure_stderr": 0.002155687684091724, "rouge1_precision": 0.08172885429788375, "rouge1_precision_stderr": 0.0031593114449411995, "rouge1_recall": 0.06880607657481164, "rouge1_recall_stderr": 0.0025890657802543843, "rouge2_fmeasure": 0.016306136251979797, "rouge2_fmeasure_stderr": 0.0008516499355170893, "rouge2_precision": 0.02333833752926271, "rouge2_precision_stderr": 0.0015030616397154965, "rouge2_recall": 0.018396239255635764, "rouge2_recall_stderr": 0.001045632678195372, "rougeL_fmeasure": 0.047481918108786006, "rougeL_fmeasure_stderr": 0.001679846765086699, "rougeL_precision": 0.06522015073123037, "rougeL_precision_stderr": 0.0026414107544845554, "rougeL_recall": 0.053199755807901684, "rougeL_recall_stderr": 0.002028938653804975, "rougeLsum_fmeasure": 0.05722336037021286, "rougeLsum_fmeasure_stderr": 0.002006378468825137, "rougeLsum_precision": 0.07691174733451789, "rougeLsum_precision_stderr": 0.0030091759153711927, "rougeLsum_recall": 0.06407113817992571, "rougeLsum_recall_stderr": 0.002407483027587739}}, "5": {"tldr_en": {"bleu": 6.788927091230416e-13, "bleu_stderr": 5.3190288411298046e-12, "rouge1_fmeasure": 0.009463053541826822, "rouge1_fmeasure_stderr": 0.0009145339358699636, "rouge1_precision": 0.012848959719309508, "rouge1_precision_stderr": 0.0013119884844163163, "rouge1_recall": 0.010311420129546226, "rouge1_recall_stderr": 0.0010848349785527766, "rouge2_fmeasure": 0.0024767980328090607, "rouge2_fmeasure_stderr": 0.00033878203552135646, "rouge2_precision": 0.00383713070490352, "rouge2_precision_stderr": 0.000679000049070121, "rouge2_recall": 0.002691389750432684, "rouge2_recall_stderr": 0.00039328749507485294, "rougeL_fmeasure": 0.007623920574636888, "rougeL_fmeasure_stderr": 0.00074262701496866, "rougeL_precision": 0.010677492926423284, "rougeL_precision_stderr": 0.0011412324336550364, "rougeL_recall": 0.008217313076562338, "rougeL_recall_stderr": 0.0008636920884600956, "rougeLsum_fmeasure": 0.0089451879827669, "rougeLsum_fmeasure_stderr": 0.0008630902539268249, "rougeLsum_precision": 0.012210240397913602, "rougeLsum_precision_stderr": 0.0012594872826179838, "rougeLsum_recall": 0.00974458097545787, "rougeLsum_recall_stderr": 0.001023511123119965}}}, "e2e_nlg_cleaned": {"0": {"generate_text_restaurant": {"bleu": 0.15232871634896603, "bleu_stderr": 0.020812270261486823, "rouge1_fmeasure": 0.020954271163547446, "rouge1_fmeasure_stderr": 0.0007980489867592098, "rouge1_precision": 0.01770379177388514, "rouge1_precision_stderr": 0.0007712828154957143, "rouge1_recall": 0.028491661886720938, "rouge1_recall_stderr": 0.0010891578916398857, "rouge2_fmeasure": 0.00255026898454171, "rouge2_fmeasure_stderr": 0.0003936972479245331, "rouge2_precision": 0.002501895673880381, "rouge2_precision_stderr": 0.00042732541832556033, "rouge2_recall": 0.0034077667682669804, "rouge2_recall_stderr": 0.0005511526902650941, "rougeL_fmeasure": 0.020230168243995296, "rougeL_fmeasure_stderr": 0.0006931916013766407, "rougeL_precision": 0.01712932032724213, "rougeL_precision_stderr": 0.0007023823982565856, "rougeL_recall": 0.027450404231693933, "rougeL_recall_stderr": 0.0009294384582174001, "rougeLsum_fmeasure": 0.020282346611517486, "rougeLsum_fmeasure_stderr": 0.000767526686930157, "rougeLsum_precision": 0.01715807340633443, "rougeLsum_precision_stderr": 0.0007495810339305068, "rougeLsum_recall": 0.027584765389295527, "rougeLsum_recall_stderr": 0.001051599270290686}}, "1": {"generate_text_restaurant": {"bleu": 11.955740880134837, "bleu_stderr": 0.15642139786964473, "rouge1_fmeasure": 0.4567598668167415, "rouge1_fmeasure_stderr": 0.0023932905161546223, "rouge1_precision": 0.5523543366276142, "rouge1_precision_stderr": 0.0032273194133200615, "rouge1_recall": 0.42797708934193157, "rouge1_recall_stderr": 0.0030241470346410635, "rouge2_fmeasure": 0.21585820859060773, "rouge2_fmeasure_stderr": 0.0020692552291630066, "rouge2_precision": 0.2643215040772804, "rouge2_precision_stderr": 0.0026722105312840154, "rouge2_recall": 0.20215308199057408, "rouge2_recall_stderr": 0.0022121806698831336, "rougeL_fmeasure": 0.3344463176631742, "rougeL_fmeasure_stderr": 0.0021371990381405573, "rougeL_precision": 0.40750234018593817, "rougeL_precision_stderr": 0.002971833950463029, "rougeL_recall": 0.3125157249212724, "rougeL_recall_stderr": 0.0025035354662693373, "rougeLsum_fmeasure": 0.37643903958132885, "rougeLsum_fmeasure_stderr": 0.0023685867771283033, "rougeLsum_precision": 0.45652280658634536, "rougeLsum_precision_stderr": 0.0031709106886728365, "rougeLsum_recall": 0.3523732297311478, "rougeLsum_recall_stderr": 0.002796550103045126}}, "2": {"generate_text_restaurant": {"bleu": 13.897352692245587, "bleu_stderr": 0.14980000038720503, "rouge1_fmeasure": 0.4802344330712051, "rouge1_fmeasure_stderr": 0.002320930303516199, "rouge1_precision": 0.561794916535469, "rouge1_precision_stderr": 0.003099458635885747, "rouge1_recall": 0.4567589519097586, "rouge1_recall_stderr": 0.0030026914172325615, "rouge2_fmeasure": 0.2367775628405086, "rouge2_fmeasure_stderr": 0.0020846614978106194, "rouge2_precision": 0.2792219908408161, "rouge2_precision_stderr": 0.002614017045402319, "rouge2_recall": 0.22598550083511856, "rouge2_recall_stderr": 0.002301745671244508, "rougeL_fmeasure": 0.351524532586077, "rougeL_fmeasure_stderr": 0.002116811888824175, "rougeL_precision": 0.4125697759457242, "rougeL_precision_stderr": 0.0028156824620878228, "rougeL_recall": 0.3342012776517918, "rougeL_recall_stderr": 0.0025457481527686697, "rougeLsum_fmeasure": 0.39951857535439594, "rougeLsum_fmeasure_stderr": 0.0023615361382931218, "rougeLsum_precision": 0.4679766836272037, "rougeLsum_precision_stderr": 0.003077550404036877, "rougeLsum_recall": 0.37978796737629206, "rougeLsum_recall_stderr": 0.002832179161262596}}, "3": {"generate_text_restaurant": {"bleu": 14.426686249425238, "bleu_stderr": 0.07922124112239044, "rouge1_fmeasure": 0.48630114866568, "rouge1_fmeasure_stderr": 0.0022963886540455164, "rouge1_precision": 0.5680260430312276, "rouge1_precision_stderr": 0.0030913554764194547, "rouge1_recall": 0.46062214346005564, "rouge1_recall_stderr": 0.002938192474222987, "rouge2_fmeasure": 0.24302456733362562, "rouge2_fmeasure_stderr": 0.0021567426223923106, "rouge2_precision": 0.2861172769387419, "rouge2_precision_stderr": 0.002690477373583243, "rouge2_recall": 0.2310837031392793, "rouge2_recall_stderr": 0.0023655149673605107, "rougeL_fmeasure": 0.35690884478009743, "rougeL_fmeasure_stderr": 0.0021650316694958355, "rougeL_precision": 0.41780470464632935, "rougeL_precision_stderr": 0.00284479912148554, "rougeL_recall": 0.3380514128610829, "rougeL_recall_stderr": 0.002554824733679187, "rougeLsum_fmeasure": 0.4059984680960094, "rougeLsum_fmeasure_stderr": 0.0023597610029612243, "rougeLsum_precision": 0.47406884298114293, "rougeLsum_precision_stderr": 0.003048747619228675, "rougeLsum_recall": 0.3848877688500459, "rougeLsum_recall_stderr": 0.002821475089819001}}, "4": {"generate_text_restaurant": {"bleu": 14.2425385270368, "bleu_stderr": 0.12070465932038754, "rouge1_fmeasure": 0.48405302137560413, "rouge1_fmeasure_stderr": 0.0023511056226272723, "rouge1_precision": 0.5674339183550579, "rouge1_precision_stderr": 0.0031765208159065333, "rouge1_recall": 0.45589676217731373, "rouge1_recall_stderr": 0.0028927956512816914, "rouge2_fmeasure": 0.24122038943708105, "rouge2_fmeasure_stderr": 0.002185560838559176, "rouge2_precision": 0.28512193921853746, "rouge2_precision_stderr": 0.0027192588682938886, "rouge2_recall": 0.22748223092470107, "rouge2_recall_stderr": 0.002317019903101863, "rougeL_fmeasure": 0.35621729860823614, "rougeL_fmeasure_stderr": 0.00219679008764647, "rougeL_precision": 0.41854952516509386, "rougeL_precision_stderr": 0.0028845475934422132, "rougeL_recall": 0.3354088230242437, "rougeL_recall_stderr": 0.0025175251927694814, "rougeLsum_fmeasure": 0.405571228031194, "rougeLsum_fmeasure_stderr": 0.002421046900033825, "rougeLsum_precision": 0.4751881399496292, "rougeLsum_precision_stderr": 0.003113603195689234, "rougeLsum_recall": 0.3821462060193808, "rougeLsum_recall_stderr": 0.002793602104629368}}, "5": {"generate_text_restaurant": {"bleu": 14.361008320584343, "bleu_stderr": 0.1560368843029399, "rouge1_fmeasure": 0.48445698386739383, "rouge1_fmeasure_stderr": 0.002342258145013874, "rouge1_precision": 0.5690777901256877, "rouge1_precision_stderr": 0.0032322208735574096, "rouge1_recall": 0.45484384858111365, "rouge1_recall_stderr": 0.002842522185270529, "rouge2_fmeasure": 0.243596769826614, "rouge2_fmeasure_stderr": 0.002164197721918074, "rouge2_precision": 0.28959806457707354, "rouge2_precision_stderr": 0.002772700376334683, "rouge2_recall": 0.2287344578632653, "rouge2_recall_stderr": 0.0022822820197528288, "rougeL_fmeasure": 0.3585342364636756, "rougeL_fmeasure_stderr": 0.0021296678714575203, "rougeL_precision": 0.4222734045194765, "rougeL_precision_stderr": 0.002886687722686102, "rougeL_recall": 0.3365984183167644, "rougeL_recall_stderr": 0.002444470426579007, "rougeLsum_fmeasure": 0.4072114109794734, "rougeLsum_fmeasure_stderr": 0.0023913662984892826, "rougeLsum_precision": 0.47857494456631217, "rougeLsum_precision_stderr": 0.0031621123336196618, "rougeLsum_recall": 0.38225762195387136, "rougeLsum_recall_stderr": 0.0027342556691813064}}}, "gem_xsum": {"0": {"article_DOC_summary": {"bleu": 1.9735502840922572, "bleu_stderr": 0.07275406618552088, "rouge1_fmeasure": 0.1994811520035836, "rouge1_fmeasure_stderr": 0.002984688412674603, "rouge1_precision": 0.14683911932801988, "rouge1_precision_stderr": 0.0024209614448014935, "rouge1_recall": 0.33232051267525825, "rouge1_recall_stderr": 0.004965206416592606, "rouge2_fmeasure": 0.04812859174134576, "rouge2_fmeasure_stderr": 0.001607211256469432, "rouge2_precision": 0.0347877835737417, "rouge2_precision_stderr": 0.0011768705530675132, "rouge2_recall": 0.08224966786374009, "rouge2_recall_stderr": 0.0027934031626812928, "rougeL_fmeasure": 0.146380284799072, "rougeL_fmeasure_stderr": 0.0022388632798941263, "rougeL_precision": 0.10790546336960771, "rougeL_precision_stderr": 0.0018864163308328482, "rougeL_recall": 0.2448853816068894, "rougeL_recall_stderr": 0.0038264085032181728, "rougeLsum_fmeasure": 0.1589223000999379, "rougeLsum_fmeasure_stderr": 0.002474373290963512, "rougeLsum_precision": 0.1169016398885232, "rougeLsum_precision_stderr": 0.002030057097593571, "rougeLsum_recall": 0.2661904377997672, "rougeLsum_recall_stderr": 0.004231721336986767}}, "1": {"article_DOC_summary": {"bleu": 1.638300206290867, "bleu_stderr": 0.07822743390841481, "rouge1_fmeasure": 0.19188402550566547, "rouge1_fmeasure_stderr": 0.002827706721355569, "rouge1_precision": 0.1587565929424201, "rouge1_precision_stderr": 0.002734028004150954, "rouge1_recall": 0.2839429315342853, "rouge1_recall_stderr": 0.004504901492577771, "rouge2_fmeasure": 0.03709731053424962, "rouge2_fmeasure_stderr": 0.0015618279370815137, "rouge2_precision": 0.029846851134275015, "rouge2_precision_stderr": 0.0013392701936661123, "rouge2_recall": 0.0574725840470226, "rouge2_recall_stderr": 0.00246069245408357, "rougeL_fmeasure": 0.14286744054243364, "rougeL_fmeasure_stderr": 0.0021068352185527133, "rougeL_precision": 0.1181498323911531, "rougeL_precision_stderr": 0.002030579033137931, "rougeL_recall": 0.2124355930003259, "rougeL_recall_stderr": 0.003465890162302496, "rougeLsum_fmeasure": 0.1487243376167721, "rougeLsum_fmeasure_stderr": 0.0022534985476107437, "rougeLsum_precision": 0.12248206747333056, "rougeLsum_precision_stderr": 0.0020938304134755963, "rougeLsum_recall": 0.22210978407966295, "rougeLsum_recall_stderr": 0.00378568398661764}}, "2": {"article_DOC_summary": {"bleu": 1.8180132235300948, "bleu_stderr": 0.10800461107815497, "rouge1_fmeasure": 0.20016621421606, "rouge1_fmeasure_stderr": 0.0029081034648420524, "rouge1_precision": 0.17315356567023985, "rouge1_precision_stderr": 0.0032567814817309163, "rouge1_recall": 0.28736976708095296, "rouge1_recall_stderr": 0.004257004996623704, "rouge2_fmeasure": 0.04221291192859074, "rouge2_fmeasure_stderr": 0.0017897129758792792, "rouge2_precision": 0.03675600130879838, "rouge2_precision_stderr": 0.0018004136622862172, "rouge2_recall": 0.061344714470415035, "rouge2_recall_stderr": 0.0025169166680391974, "rougeL_fmeasure": 0.15402918525247972, "rougeL_fmeasure_stderr": 0.002267194194181029, "rougeL_precision": 0.13304195544493516, "rougeL_precision_stderr": 0.0025505916245897793, "rougeL_recall": 0.22240633657661427, "rougeL_recall_stderr": 0.0033618144117980413, "rougeLsum_fmeasure": 0.15727848493672736, "rougeLsum_fmeasure_stderr": 0.002372060789387804, "rougeLsum_precision": 0.13553932746039002, "rougeLsum_precision_stderr": 0.002600318961574337, "rougeLsum_recall": 0.22810281420861347, "rougeLsum_recall_stderr": 0.0036392464751532154}}, "3": {"article_DOC_summary": {"bleu": 1.8375265128691776, "bleu_stderr": 0.11380329430209277, "rouge1_fmeasure": 0.19568743419032586, "rouge1_fmeasure_stderr": 0.0032421572082825824, "rouge1_precision": 0.17229167511698984, "rouge1_precision_stderr": 0.0035468885296608124, "rouge1_recall": 0.2727682959834323, "rouge1_recall_stderr": 0.004455577411908, "rouge2_fmeasure": 0.040818146352504275, "rouge2_fmeasure_stderr": 0.001758412694246694, "rouge2_precision": 0.03640068625403459, "rouge2_precision_stderr": 0.00180003629009263, "rouge2_recall": 0.05714643040549625, "rouge2_recall_stderr": 0.002391106418603193, "rougeL_fmeasure": 0.14751313359534127, "rougeL_fmeasure_stderr": 0.002427984258029977, "rougeL_precision": 0.12934549628784311, "rougeL_precision_stderr": 0.0026499682938759214, "rougeL_recall": 0.2079367842088016, "rougeL_recall_stderr": 0.003506259792687054, "rougeLsum_fmeasure": 0.15176201376572815, "rougeLsum_fmeasure_stderr": 0.002540088784293334, "rougeLsum_precision": 0.13258510136274942, "rougeLsum_precision_stderr": 0.0026954493602500585, "rougeLsum_recall": 0.21466898986359226, "rougeLsum_recall_stderr": 0.003760210367462346}}, "4": {"article_DOC_summary": {"bleu": 0.46372311709585096, "bleu_stderr": 0.09429799136651668, "rouge1_fmeasure": 0.050905820351251574, "rouge1_fmeasure_stderr": 0.002936649188749722, "rouge1_precision": 0.049854157064987935, "rouge1_precision_stderr": 0.0030861147190811536, "rouge1_recall": 0.06666637829573964, "rouge1_recall_stderr": 0.003951494050861984, "rouge2_fmeasure": 0.010127271795302999, "rouge2_fmeasure_stderr": 0.0010361348734861174, "rouge2_precision": 0.009568873692323173, "rouge2_precision_stderr": 0.0010725443721543572, "rouge2_recall": 0.01374863634918288, "rouge2_recall_stderr": 0.0014545824225490266, "rougeL_fmeasure": 0.03882864608439493, "rougeL_fmeasure_stderr": 0.0022207318687529937, "rougeL_precision": 0.03859045897117773, "rougeL_precision_stderr": 0.0024258515639221765, "rougeL_recall": 0.05102740916511275, "rougeL_recall_stderr": 0.003040146906444265, "rougeLsum_fmeasure": 0.03984498899321002, "rougeLsum_fmeasure_stderr": 0.0023064027916115458, "rougeLsum_precision": 0.039682572877387905, "rougeLsum_precision_stderr": 0.0025137153001535515, "rougeLsum_recall": 0.05223871369062228, "rougeLsum_recall_stderr": 0.003168762214579924}}, "5": {"article_DOC_summary": {"bleu": 1.1113865171956142e-43, "bleu_stderr": 1.4470133621020118e-34, "rouge1_fmeasure": 0.003113321950673498, "rouge1_fmeasure_stderr": 0.0008689581396887578, "rouge1_precision": 0.00375709923706833, "rouge1_precision_stderr": 0.001067372185961691, "rouge1_recall": 0.0027436329216451176, "rouge1_recall_stderr": 0.0007640456916008605, "rouge2_fmeasure": 0.0004798845639226407, "rouge2_fmeasure_stderr": 0.00020204272629620264, "rouge2_precision": 0.0005930059273566488, "rouge2_precision_stderr": 0.0002584437833429403, "rouge2_recall": 0.000410764780909065, "rouge2_recall_stderr": 0.00016925078259344875, "rougeL_fmeasure": 0.002297229116490886, "rougeL_fmeasure_stderr": 0.0006358236397526091, "rougeL_precision": 0.002781684748525154, "rougeL_precision_stderr": 0.0007911433597366938, "rougeL_recall": 0.002025647482597874, "rougeL_recall_stderr": 0.0005582402498199304, "rougeLsum_fmeasure": 0.0026114688524966553, "rougeLsum_fmeasure_stderr": 0.0007315944509355694, "rougeLsum_precision": 0.0031454079965436295, "rougeLsum_precision_stderr": 0.0008989173681249037, "rougeLsum_recall": 0.002308538269140517, "rougeLsum_recall_stderr": 0.0006456848704500759}}}} \ No newline at end of file diff --git a/4b284b6boscar/evaluation/generation/slim.4b284b6boscar_GEM-web_nlg_en_PALM_prompt_0.json b/4b284b6boscar/evaluation/generation/slim.4b284b6boscar_GEM-web_nlg_en_PALM_prompt_0.json new file mode 100644 index 0000000000000000000000000000000000000000..e5be8d2b3deeaa68ad6222714216a1365359d9e5 --- /dev/null +++ b/4b284b6boscar/evaluation/generation/slim.4b284b6boscar_GEM-web_nlg_en_PALM_prompt_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.36519721260505666, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.025416271815881648 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.0844897373726688, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0033773725125629405 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.23505539103583917, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.004740597986047636 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.09543970962631343, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0022861713036904717 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.03592938600180986, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.00210536271605171 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.10454144700558925, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.002991020929264074 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.041333131309197434, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0013620781060247143 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.07802708042033951, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0031165021391665213 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.22121439829830997, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004485457598638524 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.08838912443491174, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.002036320437905252 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.07911969436604507, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.003179215199169328 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.22011099433358053, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.00444184711183466 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.08923543208494557, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.002110955534608439 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-repetitions/4b284b6boscar/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6boscar/evaluation/generation/slim.4b284b6boscar_GEM-web_nlg_en_PALM_prompt_1.json b/4b284b6boscar/evaluation/generation/slim.4b284b6boscar_GEM-web_nlg_en_PALM_prompt_1.json new file mode 100644 index 0000000000000000000000000000000000000000..52ee7a15858cb3bde2fd54be5b201133381d702c --- /dev/null +++ b/4b284b6boscar/evaluation/generation/slim.4b284b6boscar_GEM-web_nlg_en_PALM_prompt_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.5519911539819539, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.033751880183173925 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.12331067244684876, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.004082368422597041 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.31067053294857805, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.005182304056477733 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.14277887519027355, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0033087097604432773 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.05879868858584044, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0025734193041066717 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.1541442248192973, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.003625807681257247 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.0689826995733388, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0021268339152713998 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.10996896485273867, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0036089432128995863 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.28822355849070946, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004809494638384607 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.128307323996298, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.00282945845782325 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.11297536382690374, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.003702439687681051 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.2915639206677481, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.00481999513451822 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.13128489500860036, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.002907234369940614 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-repetitions/4b284b6boscar/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6boscar/evaluation/generation/slim.4b284b6boscar_GEM-web_nlg_en_PALM_prompt_2.json b/4b284b6boscar/evaluation/generation/slim.4b284b6boscar_GEM-web_nlg_en_PALM_prompt_2.json new file mode 100644 index 0000000000000000000000000000000000000000..bd97df74b9503d246349393bbf010597a113a4db --- /dev/null +++ b/4b284b6boscar/evaluation/generation/slim.4b284b6boscar_GEM-web_nlg_en_PALM_prompt_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.6339259316631447, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.03754173222757458 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.14667562622284316, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.004546019252257184 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.33761348515048895, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.005110492360257298 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.168229929968101, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0038502408432064105 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.07392396630393584, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.002910921521885995 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.17359484868950906, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.003808651746140846 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.08528944755820256, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0026434056022395106 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.1288399060647976, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.003895576855972721 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.3103792864337978, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004711801576435388 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.1496329946991757, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.003280688171307162 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.13322165186378207, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.004047868682932482 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.3159788458391283, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004761168810006645 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.15396679917311523, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.003394295596411652 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-repetitions/4b284b6boscar/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6boscar/evaluation/generation/slim.4b284b6boscar_GEM-web_nlg_en_PALM_prompt_3.json b/4b284b6boscar/evaluation/generation/slim.4b284b6boscar_GEM-web_nlg_en_PALM_prompt_3.json new file mode 100644 index 0000000000000000000000000000000000000000..b80b40a6ddba9eed7754e9c98e5a6ca7aad324cb --- /dev/null +++ b/4b284b6boscar/evaluation/generation/slim.4b284b6boscar_GEM-web_nlg_en_PALM_prompt_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.6987186814977953, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.03726726363431578 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.15628268534165624, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.004738048768606994 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.34564779827066666, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.005157301361583559 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.1772674836694056, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.004003003892382963 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.08018351827536892, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0030318772722181717 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.17720834755097986, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.003776236033479815 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.08972265881218434, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.00261456940628482 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.13619096966611585, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.004034691857613383 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.3156533014362113, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004683382698871321 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.15629910293144808, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.003369049215518736 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.14106938481373726, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.004197327906695634 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.3213841281008155, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004741735159952386 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.16095302857465682, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0034922988800979277 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-repetitions/4b284b6boscar/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6boscar/evaluation/generation/slim.4b284b6boscar_GEM-web_nlg_en_PALM_prompt_4.json b/4b284b6boscar/evaluation/generation/slim.4b284b6boscar_GEM-web_nlg_en_PALM_prompt_4.json new file mode 100644 index 0000000000000000000000000000000000000000..2bd827d98437e63cfc65f165613e3833f7b44f1e --- /dev/null +++ b/4b284b6boscar/evaluation/generation/slim.4b284b6boscar_GEM-web_nlg_en_PALM_prompt_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.8132044575049523, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.04307840489572349 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.16347759704430803, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.004695561092843388 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.35695621876500805, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.005056764211988934 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.18550929394489915, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.003990007962496953 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.0858985723582815, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.003113033333072909 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.18657518824555228, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.003776015761108268 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.0960354351793, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0026996759143921977 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.14325359283567762, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0040366290353170565 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.3256089247902154, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004566067865026425 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.1644313361150259, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.003403269316136382 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.15000521793249683, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.004250104475550225 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.3336933733374621, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004658361144305201 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.170863611717608, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0035686647188022296 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-repetitions/4b284b6boscar/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6boscar/evaluation/generation/slim.4b284b6boscar_GEM-web_nlg_en_PALM_prompt_5.json b/4b284b6boscar/evaluation/generation/slim.4b284b6boscar_GEM-web_nlg_en_PALM_prompt_5.json new file mode 100644 index 0000000000000000000000000000000000000000..29e61db6eb60da3744166de442701e7893b69e71 --- /dev/null +++ b/4b284b6boscar/evaluation/generation/slim.4b284b6boscar_GEM-web_nlg_en_PALM_prompt_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.8670271385825886, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.038538862378515414 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.1746489304105952, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.004927634414508578 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.3570929599577129, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.00510044731414704 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.19328046067966642, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.004083786207840732 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.0924457972411747, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.003250827483560766 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.18760801056883655, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0037583338280536365 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.10069138588522752, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.002733147395415775 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.15182781815285762, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.004212740165200758 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.3245349442455857, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004655183104315666 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.1700662023680743, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0034658127030782362 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.15860186322431297, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.004433084191627986 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.33239822166212296, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004736491841462652 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.17643940357846452, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0036208712156513504 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-repetitions/4b284b6boscar/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6boscar/evaluation/generation/slim.4b284b6boscar_GEM-wiki_lingua_en_tldr_en_0.json b/4b284b6boscar/evaluation/generation/slim.4b284b6boscar_GEM-wiki_lingua_en_tldr_en_0.json new file mode 100644 index 0000000000000000000000000000000000000000..0d8c82d6f115c1e72a84306562421b3f8be45c5a --- /dev/null +++ b/4b284b6boscar/evaluation/generation/slim.4b284b6boscar_GEM-wiki_lingua_en_tldr_en_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.16375388077824185, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.002786961439555472 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.23310439134422403, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.003221909660619021 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.17320949923781243, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.002378543620701129 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.037266624556334636, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0010454923920460784 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.055875994550861, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0015220664383122282 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.04061809653735023, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.00102349832826798 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.12625756972987834, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.00222128685798661 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.18307142060592155, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.002551731495842583 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.1331660737775357, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0017286047933073323 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.1540530758011259, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0026719075792983353 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.2189816298141472, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0030502375778628647 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.1625224304576826, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.002244458298481143 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 2.7351635777602485, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.07279508876749892 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-repetitions/4b284b6boscar/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6boscar/evaluation/generation/slim.4b284b6boscar_GEM-wiki_lingua_en_tldr_en_1.json b/4b284b6boscar/evaluation/generation/slim.4b284b6boscar_GEM-wiki_lingua_en_tldr_en_1.json new file mode 100644 index 0000000000000000000000000000000000000000..7335b71be18e866a5f598b7399843ae30a1919a1 --- /dev/null +++ b/4b284b6boscar/evaluation/generation/slim.4b284b6boscar_GEM-wiki_lingua_en_tldr_en_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.15123352006056198, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0024770673760679054 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.16716913934962777, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0026348428468133418 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.1373767191820474, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0018611394817887653 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.02431061845270688, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0011837421322610725 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.028272726146180985, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0012762421213196886 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.02159662859311345, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0008580677013526128 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.11746495228060996, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.002010782143494058 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.12901316733192114, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0020475246892545985 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.10528556398811369, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.001369577875772531 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.14415394863180697, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0023568768994817993 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.15910651619208108, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0024820476138855316 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.13070955427136605, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0017418060665744168 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 1.5561631327305139, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.10739388531682377 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-repetitions/4b284b6boscar/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6boscar/evaluation/generation/slim.4b284b6boscar_GEM-wiki_lingua_en_tldr_en_2.json b/4b284b6boscar/evaluation/generation/slim.4b284b6boscar_GEM-wiki_lingua_en_tldr_en_2.json new file mode 100644 index 0000000000000000000000000000000000000000..caadd221f37ab1ce20feeb8133f21ef792d7c822 --- /dev/null +++ b/4b284b6boscar/evaluation/generation/slim.4b284b6boscar_GEM-wiki_lingua_en_tldr_en_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.22357648926183488, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.003403496745004805 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.23108898978062387, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0030992082209375404 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.192430862820694, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.002247003523313584 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.05797035629216586, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0019885419913011878 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.05603656429890668, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0015489521328666466 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.04630531032723199, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.001181587468860551 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.17191667887153705, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.002828831061851297 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.17481639425872558, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.00239216857453571 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.14514841535686332, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0016966632675560788 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.21113970538486854, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.003241662223820054 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.2176159104822485, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0029107305579356567 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.18120773649298935, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.002105112894775109 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 2.9166281994554626, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.10032940921674821 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-repetitions/4b284b6boscar/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6boscar/evaluation/generation/slim.4b284b6boscar_GEM-wiki_lingua_en_tldr_en_3.json b/4b284b6boscar/evaluation/generation/slim.4b284b6boscar_GEM-wiki_lingua_en_tldr_en_3.json new file mode 100644 index 0000000000000000000000000000000000000000..898982b1b16ce2b4cde41b799e369e65b93d83da --- /dev/null +++ b/4b284b6boscar/evaluation/generation/slim.4b284b6boscar_GEM-wiki_lingua_en_tldr_en_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.22569902995445462, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0038809742804849726 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.2086225275591831, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.003315098779166745 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.180670243747566, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.00257608420712232 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.06416547038499339, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.002252696014479526 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.05497059771205241, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0015764253563869673 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.04738710642101166, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0012700610973697954 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.1753927608616659, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.003290552112282621 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.1568733502695627, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0025476820762455315 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.1360067434991587, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.001953782240535597 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.21377973674170142, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.003735318958801609 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.19665901832256616, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0031297483130912885 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.1702338547406735, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0024243380669135895 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 2.779506277921281, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.12229466738338372 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-repetitions/4b284b6boscar/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6boscar/evaluation/generation/slim.4b284b6boscar_GEM-wiki_lingua_en_tldr_en_4.json b/4b284b6boscar/evaluation/generation/slim.4b284b6boscar_GEM-wiki_lingua_en_tldr_en_4.json new file mode 100644 index 0000000000000000000000000000000000000000..7c3ca4a2bdbf17ed76fdc4ea67b93e039473c746 --- /dev/null +++ b/4b284b6boscar/evaluation/generation/slim.4b284b6boscar_GEM-wiki_lingua_en_tldr_en_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.08172885429788375, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0031593114449411995 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.06880607657481164, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0025890657802543843 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.06135106282233744, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.002155687684091724 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.02333833752926271, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0015030616397154965 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.018396239255635764, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.001045632678195372 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.016306136251979797, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0008516499355170893 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.06522015073123037, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0026414107544845554 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.053199755807901684, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.002028938653804975 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.047481918108786006, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.001679846765086699 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.07691174733451789, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0030091759153711927 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.06407113817992571, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.002407483027587739 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.05722336037021286, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.002006378468825137 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 0.14389085369232565, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.018449228139014652 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-repetitions/4b284b6boscar/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6boscar/evaluation/generation/slim.4b284b6boscar_GEM-wiki_lingua_en_tldr_en_5.json b/4b284b6boscar/evaluation/generation/slim.4b284b6boscar_GEM-wiki_lingua_en_tldr_en_5.json new file mode 100644 index 0000000000000000000000000000000000000000..70d86551ec8fb94f13a15cab01422136f1ed94c9 --- /dev/null +++ b/4b284b6boscar/evaluation/generation/slim.4b284b6boscar_GEM-wiki_lingua_en_tldr_en_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.012848959719309508, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0013119884844163163 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.010311420129546226, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0010848349785527766 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.009463053541826822, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0009145339358699636 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.00383713070490352, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.000679000049070121 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.002691389750432684, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.00039328749507485294 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.0024767980328090607, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.00033878203552135646 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.010677492926423284, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0011412324336550364 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.008217313076562338, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0008636920884600956 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.007623920574636888, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.00074262701496866 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.012210240397913602, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0012594872826179838 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.00974458097545787, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.001023511123119965 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.0089451879827669, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0008630902539268249 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 6.788927091230416e-13, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 5.3190288411298046e-12 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-repetitions/4b284b6boscar/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6boscar/evaluation/generation/slim.4b284b6boscar_e2e_nlg_cleaned_generate_text_restaurant_0.json b/4b284b6boscar/evaluation/generation/slim.4b284b6boscar_e2e_nlg_cleaned_generate_text_restaurant_0.json new file mode 100644 index 0000000000000000000000000000000000000000..a2159d0cc84a9e1e5b765b25b1c99360e5c8a331 --- /dev/null +++ b/4b284b6boscar/evaluation/generation/slim.4b284b6boscar_e2e_nlg_cleaned_generate_text_restaurant_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 0.15232871634896603, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.020812270261486823 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.01770379177388514, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0007712828154957143 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.028491661886720938, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0010891578916398857 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.020954271163547446, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0007980489867592098 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.002501895673880381, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.00042732541832556033 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.0034077667682669804, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0005511526902650941 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.00255026898454171, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0003936972479245331 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.01712932032724213, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0007023823982565856 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.027450404231693933, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0009294384582174001 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.020230168243995296, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0006931916013766407 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.01715807340633443, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0007495810339305068 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.027584765389295527, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.001051599270290686 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.020282346611517486, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.000767526686930157 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-repetitions/4b284b6boscar/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6boscar/evaluation/generation/slim.4b284b6boscar_e2e_nlg_cleaned_generate_text_restaurant_1.json b/4b284b6boscar/evaluation/generation/slim.4b284b6boscar_e2e_nlg_cleaned_generate_text_restaurant_1.json new file mode 100644 index 0000000000000000000000000000000000000000..e78b062bc13e20366fbc99c57f4d84f0bbe7f26c --- /dev/null +++ b/4b284b6boscar/evaluation/generation/slim.4b284b6boscar_e2e_nlg_cleaned_generate_text_restaurant_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 11.955740880134837, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.15642139786964473 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.5523543366276142, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0032273194133200615 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.42797708934193157, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0030241470346410635 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.4567598668167415, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0023932905161546223 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.2643215040772804, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0026722105312840154 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.20215308199057408, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0022121806698831336 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.21585820859060773, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0020692552291630066 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.40750234018593817, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.002971833950463029 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.3125157249212724, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0025035354662693373 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.3344463176631742, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0021371990381405573 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.45652280658634536, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0031709106886728365 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.3523732297311478, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.002796550103045126 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.37643903958132885, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0023685867771283033 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-repetitions/4b284b6boscar/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6boscar/evaluation/generation/slim.4b284b6boscar_e2e_nlg_cleaned_generate_text_restaurant_2.json b/4b284b6boscar/evaluation/generation/slim.4b284b6boscar_e2e_nlg_cleaned_generate_text_restaurant_2.json new file mode 100644 index 0000000000000000000000000000000000000000..f0b9389dbd63a1844d54e8849453bf6d8a58b0a3 --- /dev/null +++ b/4b284b6boscar/evaluation/generation/slim.4b284b6boscar_e2e_nlg_cleaned_generate_text_restaurant_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 13.897352692245587, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.14980000038720503 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.561794916535469, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.003099458635885747 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.4567589519097586, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0030026914172325615 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.4802344330712051, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.002320930303516199 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.2792219908408161, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.002614017045402319 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.22598550083511856, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.002301745671244508 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.2367775628405086, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0020846614978106194 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.4125697759457242, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0028156824620878228 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.3342012776517918, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0025457481527686697 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.351524532586077, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.002116811888824175 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.4679766836272037, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.003077550404036877 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.37978796737629206, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.002832179161262596 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.39951857535439594, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0023615361382931218 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-repetitions/4b284b6boscar/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6boscar/evaluation/generation/slim.4b284b6boscar_e2e_nlg_cleaned_generate_text_restaurant_3.json b/4b284b6boscar/evaluation/generation/slim.4b284b6boscar_e2e_nlg_cleaned_generate_text_restaurant_3.json new file mode 100644 index 0000000000000000000000000000000000000000..4e4ea0e15371ce3c38f5453a133ed7440d92fa79 --- /dev/null +++ b/4b284b6boscar/evaluation/generation/slim.4b284b6boscar_e2e_nlg_cleaned_generate_text_restaurant_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 14.426686249425238, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.07922124112239044 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.5680260430312276, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0030913554764194547 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.46062214346005564, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.002938192474222987 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.48630114866568, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0022963886540455164 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.2861172769387419, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.002690477373583243 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.2310837031392793, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0023655149673605107 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.24302456733362562, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0021567426223923106 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.41780470464632935, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.00284479912148554 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.3380514128610829, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.002554824733679187 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.35690884478009743, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0021650316694958355 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.47406884298114293, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.003048747619228675 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.3848877688500459, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.002821475089819001 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.4059984680960094, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0023597610029612243 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-repetitions/4b284b6boscar/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6boscar/evaluation/generation/slim.4b284b6boscar_e2e_nlg_cleaned_generate_text_restaurant_4.json b/4b284b6boscar/evaluation/generation/slim.4b284b6boscar_e2e_nlg_cleaned_generate_text_restaurant_4.json new file mode 100644 index 0000000000000000000000000000000000000000..60bd1504c9d78941d30637263dd7553775beb78a --- /dev/null +++ b/4b284b6boscar/evaluation/generation/slim.4b284b6boscar_e2e_nlg_cleaned_generate_text_restaurant_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 14.2425385270368, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.12070465932038754 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.5674339183550579, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0031765208159065333 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.45589676217731373, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0028927956512816914 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.48405302137560413, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0023511056226272723 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.28512193921853746, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0027192588682938886 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.22748223092470107, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.002317019903101863 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.24122038943708105, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.002185560838559176 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.41854952516509386, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0028845475934422132 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.3354088230242437, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0025175251927694814 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.35621729860823614, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.00219679008764647 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.4751881399496292, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.003113603195689234 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.3821462060193808, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.002793602104629368 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.405571228031194, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.002421046900033825 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-repetitions/4b284b6boscar/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6boscar/evaluation/generation/slim.4b284b6boscar_e2e_nlg_cleaned_generate_text_restaurant_5.json b/4b284b6boscar/evaluation/generation/slim.4b284b6boscar_e2e_nlg_cleaned_generate_text_restaurant_5.json new file mode 100644 index 0000000000000000000000000000000000000000..835de61a6b925dc131ab88b610cf8b7cce5f2e33 --- /dev/null +++ b/4b284b6boscar/evaluation/generation/slim.4b284b6boscar_e2e_nlg_cleaned_generate_text_restaurant_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 14.361008320584343, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.1560368843029399 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.5690777901256877, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0032322208735574096 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.45484384858111365, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.002842522185270529 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.48445698386739383, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.002342258145013874 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.28959806457707354, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.002772700376334683 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.2287344578632653, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0022822820197528288 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.243596769826614, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.002164197721918074 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.4222734045194765, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.002886687722686102 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.3365984183167644, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.002444470426579007 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.3585342364636756, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0021296678714575203 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.47857494456631217, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0031621123336196618 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.38225762195387136, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0027342556691813064 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.4072114109794734, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0023913662984892826 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-repetitions/4b284b6boscar/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6boscar/evaluation/generation/slim.4b284b6boscar_gem_xsum_article_DOC_summary_0.json b/4b284b6boscar/evaluation/generation/slim.4b284b6boscar_gem_xsum_article_DOC_summary_0.json new file mode 100644 index 0000000000000000000000000000000000000000..189ca787c9e77e4a7d92ceab614d6217d9bd0032 --- /dev/null +++ b/4b284b6boscar/evaluation/generation/slim.4b284b6boscar_gem_xsum_article_DOC_summary_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.14683911932801988, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0024209614448014935 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.33232051267525825, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.004965206416592606 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.1994811520035836, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.002984688412674603 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.0347877835737417, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0011768705530675132 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.08224966786374009, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0027934031626812928 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.04812859174134576, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.001607211256469432 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.10790546336960771, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0018864163308328482 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.2448853816068894, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0038264085032181728 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.146380284799072, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0022388632798941263 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.1169016398885232, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.002030057097593571 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.2661904377997672, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.004231721336986767 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.1589223000999379, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.002474373290963512 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 1.9735502840922572, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.07275406618552088 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-repetitions/4b284b6boscar/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6boscar/evaluation/generation/slim.4b284b6boscar_gem_xsum_article_DOC_summary_1.json b/4b284b6boscar/evaluation/generation/slim.4b284b6boscar_gem_xsum_article_DOC_summary_1.json new file mode 100644 index 0000000000000000000000000000000000000000..f884e14cec61ac92bf17e92558839c287fd667d9 --- /dev/null +++ b/4b284b6boscar/evaluation/generation/slim.4b284b6boscar_gem_xsum_article_DOC_summary_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.1587565929424201, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.002734028004150954 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.2839429315342853, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.004504901492577771 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.19188402550566547, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.002827706721355569 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.029846851134275015, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0013392701936661123 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.0574725840470226, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.00246069245408357 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.03709731053424962, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0015618279370815137 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.1181498323911531, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.002030579033137931 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.2124355930003259, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.003465890162302496 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.14286744054243364, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0021068352185527133 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.12248206747333056, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0020938304134755963 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.22210978407966295, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.00378568398661764 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.1487243376167721, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0022534985476107437 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 1.638300206290867, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.07822743390841481 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-repetitions/4b284b6boscar/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6boscar/evaluation/generation/slim.4b284b6boscar_gem_xsum_article_DOC_summary_2.json b/4b284b6boscar/evaluation/generation/slim.4b284b6boscar_gem_xsum_article_DOC_summary_2.json new file mode 100644 index 0000000000000000000000000000000000000000..24df1f32745557bf74b597440a10b22f79c134ae --- /dev/null +++ b/4b284b6boscar/evaluation/generation/slim.4b284b6boscar_gem_xsum_article_DOC_summary_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.17315356567023985, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0032567814817309163 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.28736976708095296, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.004257004996623704 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.20016621421606, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0029081034648420524 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.03675600130879838, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0018004136622862172 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.061344714470415035, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0025169166680391974 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.04221291192859074, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0017897129758792792 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.13304195544493516, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0025505916245897793 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.22240633657661427, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0033618144117980413 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.15402918525247972, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.002267194194181029 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.13553932746039002, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.002600318961574337 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.22810281420861347, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0036392464751532154 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.15727848493672736, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.002372060789387804 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 1.8180132235300948, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.10800461107815497 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-repetitions/4b284b6boscar/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6boscar/evaluation/generation/slim.4b284b6boscar_gem_xsum_article_DOC_summary_3.json b/4b284b6boscar/evaluation/generation/slim.4b284b6boscar_gem_xsum_article_DOC_summary_3.json new file mode 100644 index 0000000000000000000000000000000000000000..7bb52f794fdb9e1a2bf434145e61e92480739667 --- /dev/null +++ b/4b284b6boscar/evaluation/generation/slim.4b284b6boscar_gem_xsum_article_DOC_summary_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.17229167511698984, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0035468885296608124 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.2727682959834323, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.004455577411908 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.19568743419032586, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0032421572082825824 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.03640068625403459, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.00180003629009263 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.05714643040549625, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.002391106418603193 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.040818146352504275, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.001758412694246694 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.12934549628784311, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0026499682938759214 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.2079367842088016, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.003506259792687054 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.14751313359534127, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.002427984258029977 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.13258510136274942, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0026954493602500585 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.21466898986359226, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.003760210367462346 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.15176201376572815, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.002540088784293334 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 1.8375265128691776, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.11380329430209277 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-repetitions/4b284b6boscar/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6boscar/evaluation/generation/slim.4b284b6boscar_gem_xsum_article_DOC_summary_4.json b/4b284b6boscar/evaluation/generation/slim.4b284b6boscar_gem_xsum_article_DOC_summary_4.json new file mode 100644 index 0000000000000000000000000000000000000000..8b13cd837195dfa8a6f2c26fc4fa3b0b0f20ead7 --- /dev/null +++ b/4b284b6boscar/evaluation/generation/slim.4b284b6boscar_gem_xsum_article_DOC_summary_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.049854157064987935, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0030861147190811536 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.06666637829573964, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.003951494050861984 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.050905820351251574, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.002936649188749722 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.009568873692323173, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0010725443721543572 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.01374863634918288, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0014545824225490266 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.010127271795302999, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0010361348734861174 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.03859045897117773, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0024258515639221765 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.05102740916511275, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.003040146906444265 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.03882864608439493, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0022207318687529937 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.039682572877387905, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0025137153001535515 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.05223871369062228, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.003168762214579924 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.03984498899321002, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0023064027916115458 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 0.46372311709585096, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.09429799136651668 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-repetitions/4b284b6boscar/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6boscar/evaluation/generation/slim.4b284b6boscar_gem_xsum_article_DOC_summary_5.json b/4b284b6boscar/evaluation/generation/slim.4b284b6boscar_gem_xsum_article_DOC_summary_5.json new file mode 100644 index 0000000000000000000000000000000000000000..d52a61d99c1455b6135d2dd2cbb7d9f4f70414d8 --- /dev/null +++ b/4b284b6boscar/evaluation/generation/slim.4b284b6boscar_gem_xsum_article_DOC_summary_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.00375709923706833, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.001067372185961691 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.0027436329216451176, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.0007640456916008605 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.003113321950673498, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0008689581396887578 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.0005930059273566488, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0002584437833429403 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.000410764780909065, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.00016925078259344875 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.0004798845639226407, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.00020204272629620264 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.002781684748525154, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0007911433597366938 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.002025647482597874, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0005582402498199304 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.002297229116490886, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0006358236397526091 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.0031454079965436295, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0008989173681249037 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.002308538269140517, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0006456848704500759 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.0026114688524966553, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0007315944509355694 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 1.1113865171956142e-43, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 1.4470133621020118e-34 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-oscar-repetitions/4b284b6boscar/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6boscar/evaluation/rankeval/4b284b6boscar_0.csv b/4b284b6boscar/evaluation/rankeval/4b284b6boscar_0.csv new file mode 100644 index 0000000000000000000000000000000000000000..d5fd276dd3f080b47073f48714203b13d1663580 --- /dev/null +++ b/4b284b6boscar/evaluation/rankeval/4b284b6boscar_0.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.346,0.01505026612756445,0 +anli_r2,acc,0.322,0.014782913600996664,0 +anli_r3,acc,0.33916666666666667,0.013672343491681822,0 +arc_challenge,acc,0.23890784982935154,0.012461071376316614,0 +arc_challenge,acc_norm,0.28071672354948807,0.013131238126975578,0 +arc_easy,acc,0.5286195286195287,0.010242962617927195,0 +arc_easy,acc_norm,0.4671717171717172,0.01023764577885386,0 +boolq,acc,0.5296636085626911,0.008729651343606142,1 +cb,acc,0.21428571428571427,0.055328333517248834,1 +cb,f1,0.14579916165482049,,1 +copa,acc,0.71,0.045604802157206845,0 +hellaswag,acc,0.3952399920334595,0.00487903001059892,0 +hellaswag,acc_norm,0.48884684325831507,0.004988539870174637,0 +piqa,acc,0.7110990206746464,0.010575111841364901,0 +piqa,acc_norm,0.7143634385201306,0.010539303948661908,0 +rte,acc,0.5379061371841155,0.03000984891252912,0 +sciq,acc,0.805,0.012535235623319327,0 +sciq,acc_norm,0.69,0.014632638658632905,0 +storycloze_2016,acc,0.6568679850347408,0.010978648097499866,0 +winogrande,acc,0.5224940805051302,0.014038257824059878,0 diff --git a/4b284b6boscar/evaluation/rankeval/4b284b6boscar_0.json b/4b284b6boscar/evaluation/rankeval/4b284b6boscar_0.json new file mode 100644 index 0000000000000000000000000000000000000000..c5362eef297c70b30357499c55b6b08e0b43aedf --- /dev/null +++ b/4b284b6boscar/evaluation/rankeval/4b284b6boscar_0.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.346, + "acc_stderr": 0.01505026612756445 + }, + "anli_r2": { + "acc": 0.322, + "acc_stderr": 0.014782913600996664 + }, + "anli_r3": { + "acc": 0.33916666666666667, + "acc_stderr": 0.013672343491681822 + }, + "cb": { + "acc": 0.21428571428571427, + "acc_stderr": 0.055328333517248834, + "f1": 0.14579916165482049 + }, + "copa": { + "acc": 0.71, + "acc_stderr": 0.045604802157206845 + }, + "hellaswag": { + "acc": 0.3952399920334595, + "acc_stderr": 0.00487903001059892, + "acc_norm": 0.48884684325831507, + "acc_norm_stderr": 0.004988539870174637 + }, + "rte": { + "acc": 0.5379061371841155, + "acc_stderr": 0.03000984891252912 + }, + "winogrande": { + "acc": 0.5224940805051302, + "acc_stderr": 0.014038257824059878 + }, + "storycloze_2016": { + "acc": 0.6568679850347408, + "acc_stderr": 0.010978648097499866 + }, + "boolq": { + "acc": 0.5296636085626911, + "acc_stderr": 0.008729651343606142 + }, + "arc_easy": { + "acc": 0.5286195286195287, + "acc_stderr": 0.010242962617927195, + "acc_norm": 0.4671717171717172, + "acc_norm_stderr": 0.01023764577885386 + }, + "arc_challenge": { + "acc": 0.23890784982935154, + "acc_stderr": 0.012461071376316614, + "acc_norm": 0.28071672354948807, + "acc_norm_stderr": 0.013131238126975578 + }, + "sciq": { + "acc": 0.805, + "acc_stderr": 0.012535235623319327, + "acc_norm": 0.69, + "acc_norm_stderr": 0.014632638658632905 + }, + "piqa": { + "acc": 0.7110990206746464, + "acc_stderr": 0.010575111841364901, + "acc_norm": 0.7143634385201306, + "acc_norm_stderr": 0.010539303948661908 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b6boscar/evaluation/rankeval/4b284b6boscar_1.csv b/4b284b6boscar/evaluation/rankeval/4b284b6boscar_1.csv new file mode 100644 index 0000000000000000000000000000000000000000..28521b01d01347a01d135e28193434984f8af1b6 --- /dev/null +++ b/4b284b6boscar/evaluation/rankeval/4b284b6boscar_1.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.341,0.014998131348402709,0 +anli_r2,acc,0.342,0.015008706182121728,0 +anli_r3,acc,0.3408333333333333,0.013688600793296934,0 +arc_challenge,acc,0.2568259385665529,0.0127669237941168,0 +arc_challenge,acc_norm,0.2764505119453925,0.013069662474252427,0 +arc_easy,acc,0.547979797979798,0.010212436978834102,0 +arc_easy,acc_norm,0.5197811447811448,0.010251751199542731,0 +boolq,acc,0.537920489296636,0.008719868567159634,1 +cb,acc,0.32142857142857145,0.06297362289056341,1 +cb,f1,0.17647058823529413,,1 +copa,acc,0.72,0.04512608598542127,0 +hellaswag,acc,0.39603664608643696,0.00488072678798864,0 +hellaswag,acc_norm,0.4978092013543119,0.004989733513319103,0 +piqa,acc,0.7116430903155604,0.010569190399220638,0 +piqa,acc_norm,0.7138193688792165,0.010545318576106653,0 +rte,acc,0.5126353790613718,0.030086851767188564,0 +sciq,acc,0.849,0.01132816522334168,0 +sciq,acc_norm,0.825,0.012021627157731965,0 +storycloze_2016,acc,0.652592196686264,0.011010826502718745,0 +winogrande,acc,0.5232833464877664,0.014037241309573636,0 diff --git a/4b284b6boscar/evaluation/rankeval/4b284b6boscar_1.json b/4b284b6boscar/evaluation/rankeval/4b284b6boscar_1.json new file mode 100644 index 0000000000000000000000000000000000000000..e90f9f4791b00b2df042754bcfe5ceafbf40335d --- /dev/null +++ b/4b284b6boscar/evaluation/rankeval/4b284b6boscar_1.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.341, + "acc_stderr": 0.014998131348402709 + }, + "anli_r2": { + "acc": 0.342, + "acc_stderr": 0.015008706182121728 + }, + "anli_r3": { + "acc": 0.3408333333333333, + "acc_stderr": 0.013688600793296934 + }, + "cb": { + "acc": 0.32142857142857145, + "acc_stderr": 0.06297362289056341, + "f1": 0.17647058823529413 + }, + "copa": { + "acc": 0.72, + "acc_stderr": 0.04512608598542127 + }, + "hellaswag": { + "acc": 0.39603664608643696, + "acc_stderr": 0.00488072678798864, + "acc_norm": 0.4978092013543119, + "acc_norm_stderr": 0.004989733513319103 + }, + "rte": { + "acc": 0.5126353790613718, + "acc_stderr": 0.030086851767188564 + }, + "winogrande": { + "acc": 0.5232833464877664, + "acc_stderr": 0.014037241309573636 + }, + "storycloze_2016": { + "acc": 0.652592196686264, + "acc_stderr": 0.011010826502718745 + }, + "boolq": { + "acc": 0.537920489296636, + "acc_stderr": 0.008719868567159634 + }, + "arc_easy": { + "acc": 0.547979797979798, + "acc_stderr": 0.010212436978834102, + "acc_norm": 0.5197811447811448, + "acc_norm_stderr": 0.010251751199542731 + }, + "arc_challenge": { + "acc": 0.2568259385665529, + "acc_stderr": 0.0127669237941168, + "acc_norm": 0.2764505119453925, + "acc_norm_stderr": 0.013069662474252427 + }, + "sciq": { + "acc": 0.849, + "acc_stderr": 0.01132816522334168, + "acc_norm": 0.825, + "acc_norm_stderr": 0.012021627157731965 + }, + "piqa": { + "acc": 0.7116430903155604, + "acc_stderr": 0.010569190399220638, + "acc_norm": 0.7138193688792165, + "acc_norm_stderr": 0.010545318576106653 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b6boscar/evaluation/rankeval/4b284b6boscar_2.csv b/4b284b6boscar/evaluation/rankeval/4b284b6boscar_2.csv new file mode 100644 index 0000000000000000000000000000000000000000..8fa9165db591a8ccd7b74fdc151b3ea8a698ec70 --- /dev/null +++ b/4b284b6boscar/evaluation/rankeval/4b284b6boscar_2.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.327,0.014842213153411247,0 +anli_r2,acc,0.349,0.015080663991563102,0 +anli_r3,acc,0.335,0.01363087184382147,0 +arc_challenge,acc,0.2645051194539249,0.012889272949313366,0 +arc_challenge,acc_norm,0.29266211604095566,0.01329591610361942,0 +arc_easy,acc,0.5509259259259259,0.010206428316323363,0 +arc_easy,acc_norm,0.5311447811447811,0.010239860250021745,0 +boolq,acc,0.5314984709480123,0.00872768484861531,1 +cb,acc,0.3392857142857143,0.06384226561930825,1 +cb,f1,0.1735159817351598,,1 +copa,acc,0.69,0.04648231987117316,0 +hellaswag,acc,0.39364668392750446,0.004875595792850676,0 +hellaswag,acc_norm,0.49502091216889066,0.004989533998820353,0 +piqa,acc,0.7170837867247007,0.010508949177489684,0 +piqa,acc_norm,0.7187159956474428,0.010490509832327423,0 +rte,acc,0.5451263537906137,0.029973636495415255,0 +sciq,acc,0.864,0.010845350230472986,0 +sciq,acc_norm,0.857,0.011075814808567038,0 +storycloze_2016,acc,0.6461785141635489,0.011057260832171067,0 +winogrande,acc,0.5193370165745856,0.01404197273371297,0 diff --git a/4b284b6boscar/evaluation/rankeval/4b284b6boscar_2.json b/4b284b6boscar/evaluation/rankeval/4b284b6boscar_2.json new file mode 100644 index 0000000000000000000000000000000000000000..07a5258478ba24fa53224cbe1b67b27e07d0caaf --- /dev/null +++ b/4b284b6boscar/evaluation/rankeval/4b284b6boscar_2.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.327, + "acc_stderr": 0.014842213153411247 + }, + "anli_r2": { + "acc": 0.349, + "acc_stderr": 0.015080663991563102 + }, + "anli_r3": { + "acc": 0.335, + "acc_stderr": 0.01363087184382147 + }, + "cb": { + "acc": 0.3392857142857143, + "acc_stderr": 0.06384226561930825, + "f1": 0.1735159817351598 + }, + "copa": { + "acc": 0.69, + "acc_stderr": 0.04648231987117316 + }, + "hellaswag": { + "acc": 0.39364668392750446, + "acc_stderr": 0.004875595792850676, + "acc_norm": 0.49502091216889066, + "acc_norm_stderr": 0.004989533998820353 + }, + "rte": { + "acc": 0.5451263537906137, + "acc_stderr": 0.029973636495415255 + }, + "winogrande": { + "acc": 0.5193370165745856, + "acc_stderr": 0.01404197273371297 + }, + "storycloze_2016": { + "acc": 0.6461785141635489, + "acc_stderr": 0.011057260832171067 + }, + "boolq": { + "acc": 0.5314984709480123, + "acc_stderr": 0.00872768484861531 + }, + "arc_easy": { + "acc": 0.5509259259259259, + "acc_stderr": 0.010206428316323363, + "acc_norm": 0.5311447811447811, + "acc_norm_stderr": 0.010239860250021745 + }, + "arc_challenge": { + "acc": 0.2645051194539249, + "acc_stderr": 0.012889272949313366, + "acc_norm": 0.29266211604095566, + "acc_norm_stderr": 0.01329591610361942 + }, + "sciq": { + "acc": 0.864, + "acc_stderr": 0.010845350230472986, + "acc_norm": 0.857, + "acc_norm_stderr": 0.011075814808567038 + }, + "piqa": { + "acc": 0.7170837867247007, + "acc_stderr": 0.010508949177489684, + "acc_norm": 0.7187159956474428, + "acc_norm_stderr": 0.010490509832327423 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b6boscar/evaluation/rankeval/4b284b6boscar_3.csv b/4b284b6boscar/evaluation/rankeval/4b284b6boscar_3.csv new file mode 100644 index 0000000000000000000000000000000000000000..543be4bcb644ebda35cb43cb6d39cf565a9bcef8 --- /dev/null +++ b/4b284b6boscar/evaluation/rankeval/4b284b6boscar_3.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.329,0.01486539538592837,0 +anli_r2,acc,0.317,0.014721675438880229,0 +anli_r3,acc,0.335,0.013630871843821474,0 +arc_challenge,acc,0.2551194539249147,0.012739038695202104,0 +arc_challenge,acc_norm,0.28668941979522183,0.013214986329274763,0 +arc_easy,acc,0.5547138047138047,0.010198171137873868,0 +arc_easy,acc_norm,0.5496632996632996,0.010209047724374146,0 +boolq,acc,0.5146788990825688,0.008741285568667918,1 +cb,acc,0.35714285714285715,0.06460957383809221,1 +cb,f1,0.2169237961664329,,1 +copa,acc,0.7,0.046056618647183814,0 +hellaswag,acc,0.3952399920334595,0.0048790300105989205,0 +hellaswag,acc_norm,0.4963154750049791,0.00498964592981144,0 +piqa,acc,0.7154515778019587,0.010527218464130607,0 +piqa,acc_norm,0.7143634385201306,0.010539303948661911,0 +rte,acc,0.5306859205776173,0.03003973059219781,0 +sciq,acc,0.866,0.010777762298369681,0 +sciq,acc_norm,0.86,0.010978183844357791,0 +storycloze_2016,acc,0.6536611437733832,0.01100287402644642,0 +winogrande,acc,0.5240726124704025,0.014036189665395132,0 diff --git a/4b284b6boscar/evaluation/rankeval/4b284b6boscar_3.json b/4b284b6boscar/evaluation/rankeval/4b284b6boscar_3.json new file mode 100644 index 0000000000000000000000000000000000000000..c3d14fd9b2ef9eb896d14d21bdb697997e36f8b3 --- /dev/null +++ b/4b284b6boscar/evaluation/rankeval/4b284b6boscar_3.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.329, + "acc_stderr": 0.01486539538592837 + }, + "anli_r2": { + "acc": 0.317, + "acc_stderr": 0.014721675438880229 + }, + "anli_r3": { + "acc": 0.335, + "acc_stderr": 0.013630871843821474 + }, + "cb": { + "acc": 0.35714285714285715, + "acc_stderr": 0.06460957383809221, + "f1": 0.2169237961664329 + }, + "copa": { + "acc": 0.7, + "acc_stderr": 0.046056618647183814 + }, + "hellaswag": { + "acc": 0.3952399920334595, + "acc_stderr": 0.0048790300105989205, + "acc_norm": 0.4963154750049791, + "acc_norm_stderr": 0.00498964592981144 + }, + "rte": { + "acc": 0.5306859205776173, + "acc_stderr": 0.03003973059219781 + }, + "winogrande": { + "acc": 0.5240726124704025, + "acc_stderr": 0.014036189665395132 + }, + "storycloze_2016": { + "acc": 0.6536611437733832, + "acc_stderr": 0.01100287402644642 + }, + "boolq": { + "acc": 0.5146788990825688, + "acc_stderr": 0.008741285568667918 + }, + "arc_easy": { + "acc": 0.5547138047138047, + "acc_stderr": 0.010198171137873868, + "acc_norm": 0.5496632996632996, + "acc_norm_stderr": 0.010209047724374146 + }, + "arc_challenge": { + "acc": 0.2551194539249147, + "acc_stderr": 0.012739038695202104, + "acc_norm": 0.28668941979522183, + "acc_norm_stderr": 0.013214986329274763 + }, + "sciq": { + "acc": 0.866, + "acc_stderr": 0.010777762298369681, + "acc_norm": 0.86, + "acc_norm_stderr": 0.010978183844357791 + }, + "piqa": { + "acc": 0.7154515778019587, + "acc_stderr": 0.010527218464130607, + "acc_norm": 0.7143634385201306, + "acc_norm_stderr": 0.010539303948661911 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b6boscar/evaluation/rankeval/4b284b6boscar_4.csv b/4b284b6boscar/evaluation/rankeval/4b284b6boscar_4.csv new file mode 100644 index 0000000000000000000000000000000000000000..9679d679bb4eb14edce6c6b2536a4bc3b153edd3 --- /dev/null +++ b/4b284b6boscar/evaluation/rankeval/4b284b6boscar_4.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.343,0.015019206922356951,0 +anli_r2,acc,0.329,0.014865395385928367,0 +anli_r3,acc,0.35,0.013774667009018556,0 +arc_challenge,acc,0.257679180887372,0.012780770562768405,0 +arc_challenge,acc_norm,0.2909556313993174,0.013273077865907581,0 +arc_easy,acc,0.5526094276094277,0.010202832385415646,0 +arc_easy,acc_norm,0.553030303030303,0.010201914927791678,0 +boolq,acc,0.5125382262996941,0.008742304974218316,1 +cb,acc,0.375,0.06527912098338669,1 +cb,f1,0.2518518518518518,,1 +copa,acc,0.71,0.04560480215720684,0 +hellaswag,acc,0.39603664608643696,0.004880726787988636,0 +hellaswag,acc_norm,0.4994025094602669,0.004989777848791011,0 +piqa,acc,0.719260065288357,0.010484325438311827,0 +piqa,acc_norm,0.7105549510337323,0.010581014740675616,0 +rte,acc,0.51985559566787,0.030072723167317177,0 +sciq,acc,0.876,0.010427498872343961,0 +sciq,acc_norm,0.867,0.010743669132397339,0 +storycloze_2016,acc,0.652592196686264,0.011010826502718738,0 +winogrande,acc,0.526440410418311,0.014032823874407229,0 diff --git a/4b284b6boscar/evaluation/rankeval/4b284b6boscar_4.json b/4b284b6boscar/evaluation/rankeval/4b284b6boscar_4.json new file mode 100644 index 0000000000000000000000000000000000000000..cc52f7489589dc02964abd8fe3ff480532afe19e --- /dev/null +++ b/4b284b6boscar/evaluation/rankeval/4b284b6boscar_4.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.343, + "acc_stderr": 0.015019206922356951 + }, + "anli_r2": { + "acc": 0.329, + "acc_stderr": 0.014865395385928367 + }, + "anli_r3": { + "acc": 0.35, + "acc_stderr": 0.013774667009018556 + }, + "cb": { + "acc": 0.375, + "acc_stderr": 0.06527912098338669, + "f1": 0.2518518518518518 + }, + "copa": { + "acc": 0.71, + "acc_stderr": 0.04560480215720684 + }, + "hellaswag": { + "acc": 0.39603664608643696, + "acc_stderr": 0.004880726787988636, + "acc_norm": 0.4994025094602669, + "acc_norm_stderr": 0.004989777848791011 + }, + "rte": { + "acc": 0.51985559566787, + "acc_stderr": 0.030072723167317177 + }, + "winogrande": { + "acc": 0.526440410418311, + "acc_stderr": 0.014032823874407229 + }, + "storycloze_2016": { + "acc": 0.652592196686264, + "acc_stderr": 0.011010826502718738 + }, + "boolq": { + "acc": 0.5125382262996941, + "acc_stderr": 0.008742304974218316 + }, + "arc_easy": { + "acc": 0.5526094276094277, + "acc_stderr": 0.010202832385415646, + "acc_norm": 0.553030303030303, + "acc_norm_stderr": 0.010201914927791678 + }, + "arc_challenge": { + "acc": 0.257679180887372, + "acc_stderr": 0.012780770562768405, + "acc_norm": 0.2909556313993174, + "acc_norm_stderr": 0.013273077865907581 + }, + "sciq": { + "acc": 0.876, + "acc_stderr": 0.010427498872343961, + "acc_norm": 0.867, + "acc_norm_stderr": 0.010743669132397339 + }, + "piqa": { + "acc": 0.719260065288357, + "acc_stderr": 0.010484325438311827, + "acc_norm": 0.7105549510337323, + "acc_norm_stderr": 0.010581014740675616 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b6boscar/evaluation/rankeval/4b284b6boscar_5.csv b/4b284b6boscar/evaluation/rankeval/4b284b6boscar_5.csv new file mode 100644 index 0000000000000000000000000000000000000000..96eeeae0d7b3ac17160ef7963c8366e5700c6f93 --- /dev/null +++ b/4b284b6boscar/evaluation/rankeval/4b284b6boscar_5.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.34,0.014987482264363937,0 +anli_r2,acc,0.342,0.015008706182121728,0 +anli_r3,acc,0.33916666666666667,0.013672343491681819,0 +arc_challenge,acc,0.2687713310580205,0.01295506596371069,0 +arc_challenge,acc_norm,0.28498293515358364,0.013191348179838793,0 +arc_easy,acc,0.5601851851851852,0.010185185185185316,0 +arc_easy,acc_norm,0.5660774410774411,0.010169795770462103,0 +boolq,acc,0.5110091743119266,0.008742934884517653,1 +cb,acc,0.375,0.06527912098338669,1 +cb,f1,0.18421052631578946,,1 +copa,acc,0.74,0.0440844002276808,0 +hellaswag,acc,0.39603664608643696,0.004880726787988638,0 +hellaswag,acc_norm,0.5022903804023103,0.004989729059957431,0 +piqa,acc,0.7176278563656148,0.01050282166855538,0 +piqa,acc_norm,0.7116430903155604,0.010569190399220656,0 +rte,acc,0.5306859205776173,0.030039730592197812,0 +sciq,acc,0.875,0.010463483381956722,0 +sciq,acc_norm,0.875,0.010463483381956722,0 +storycloze_2016,acc,0.6531266702298236,0.011006857922124124,0 +winogrande,acc,0.5232833464877664,0.01403724130957364,0 diff --git a/4b284b6boscar/evaluation/rankeval/4b284b6boscar_5.json b/4b284b6boscar/evaluation/rankeval/4b284b6boscar_5.json new file mode 100644 index 0000000000000000000000000000000000000000..16e74d5ff2393b93a13b49b44ecb7b99e7427116 --- /dev/null +++ b/4b284b6boscar/evaluation/rankeval/4b284b6boscar_5.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.34, + "acc_stderr": 0.014987482264363937 + }, + "anli_r2": { + "acc": 0.342, + "acc_stderr": 0.015008706182121728 + }, + "anli_r3": { + "acc": 0.33916666666666667, + "acc_stderr": 0.013672343491681819 + }, + "cb": { + "acc": 0.375, + "acc_stderr": 0.06527912098338669, + "f1": 0.18421052631578946 + }, + "copa": { + "acc": 0.74, + "acc_stderr": 0.0440844002276808 + }, + "hellaswag": { + "acc": 0.39603664608643696, + "acc_stderr": 0.004880726787988638, + "acc_norm": 0.5022903804023103, + "acc_norm_stderr": 0.004989729059957431 + }, + "rte": { + "acc": 0.5306859205776173, + "acc_stderr": 0.030039730592197812 + }, + "winogrande": { + "acc": 0.5232833464877664, + "acc_stderr": 0.01403724130957364 + }, + "storycloze_2016": { + "acc": 0.6531266702298236, + "acc_stderr": 0.011006857922124124 + }, + "boolq": { + "acc": 0.5110091743119266, + "acc_stderr": 0.008742934884517653 + }, + "arc_easy": { + "acc": 0.5601851851851852, + "acc_stderr": 0.010185185185185316, + "acc_norm": 0.5660774410774411, + "acc_norm_stderr": 0.010169795770462103 + }, + "arc_challenge": { + "acc": 0.2687713310580205, + "acc_stderr": 0.01295506596371069, + "acc_norm": 0.28498293515358364, + "acc_norm_stderr": 0.013191348179838793 + }, + "sciq": { + "acc": 0.875, + "acc_stderr": 0.010463483381956722, + "acc_norm": 0.875, + "acc_norm_stderr": 0.010463483381956722 + }, + "piqa": { + "acc": 0.7176278563656148, + "acc_stderr": 0.01050282166855538, + "acc_norm": 0.7116430903155604, + "acc_norm_stderr": 0.010569190399220656 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d8f1abea32e74186da1264ebe451c5bcc1040d1a --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a9ceb6d547168ab95b1bd84be24ac8c3b08cfc57fe2d4b40e4b21d57209f49d +size 199058647 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cf792024fd9e736ebbffc42acb1f324b6122cd62 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d86cb32c1b09d7908023a2e4cae870b404919f3416d321cf2f376aa6f63d1ad +size 199058647 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f947d6a022289d31109642018d6a9275e6ce2202 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:29e3ab3c59e31e014e81981a559cbcbf338b028041b0db9398e256b4169735b5 +size 199058733 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..782af115d1ff3407d0eb29af2c46f9307c4abce0 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:61731bd18a4e8088e5d951cd968d6c4f9e7e1624091b775b4d46b0b4a232f9d6 +size 199058733 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8367159264933cba6a345d7f0805cd3a88f27b45 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6a627824af272a3849d68cbfe2da2d55f3551b5bdc244d1bc1716f8164dd431b +size 199058797 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e866b1bed7d7d856781feec893abe6fc1015cdf5 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9083edcfc84db3771ce198ce0d395205f8e35bb210d6d36020a9a9150b8baae1 +size 199058797 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9497a44834c5b145581382f41a1f006c8bc86377 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a2c66b15a1d0635a9f6acd241bb26aa8edf72e6710694869d5d8f4659a67ed5 +size 199058733 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..806ba86a23b4c92aecf82721c6a75ed0fb54f7b5 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f2a6b3a61236d3b2446c3b16084611c155f4dedfa300eccf74c19085b2e0e55 +size 199058733 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1cd440d0fc2c8db72a5a2b26c3bbe50dc59ac7a6 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:85825731a2e3ef867a27e061bcb8d7c0e174dd0caea4508da066684337d37135 +size 199058733 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f733218053f7d5f81c353e2691f1eb4332c95abc --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77fb48a746279edb74cbec29d1a7c9b00cefbcd9d1fa31262bc309b170a654eb +size 199058733 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d19fe2b34ba372e7f4c00ef2fc060f0a437304a3 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb517c9efb522e62e0639d791c098c7b7546c1befa19ab61d6011c036f76dd0d +size 199058797 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..192b93cab9277c406187b469d0a73a06778b4c99 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4a16184675d35a9b23a87b210f648ef57b763d7f0487ad91cb3a446ed05ef4f +size 199058797 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1ba2077f11dec7a61b882d496cf3644830748297 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d2dc0f8f971bd8f7c9eff5140f188566c3d5e1d06ef933eadf1f3a0e992366c +size 199058733 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bd3343ef74a3a7d3dccba6a132c0ccc46cf2da9c --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:099be6acce8e0341a05435ee3f81e184a59f598e5c1cc0d07bd8a64bca3d6d46 +size 199058733 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..06f43efb0f2277291ab0459503b8ebf0a5dc274d --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a2cd263052c532acb80fd2bafdb6dac42c1808626e80f61733a1a04e185f2bbf +size 199058669 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ca688052ca430a366b2d4208da26dfe4e329b2fa --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d2ecb4fcee8368ea77efafb2575aa3e30bd24e677eacb7e1c437bb8a18a8964d +size 199058669 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e4686c4b299e56ec554f5c6896f61012f7d53400 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64924156442e8d972bceb37d0a6b1c42b3db8721925f17c9d3ecc9a362686954 +size 199058797 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..53290f17d5e4db05abfc82193964db0ae452f0c8 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:30228a088bcf068669b6ea5e2816bfc96fed1512251c480af5b1634429acf79c +size 199058797 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..192b1c722c1769648128ef2e42c71df9e42bab64 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5634b292cc5e65fbcdfa8aabc8eab862822c44cf6759a5606ec17b3891634175 +size 199058733 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9a6b85759901622c16e9f642383cf7c26d40c9fe --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f9b733961aed500c0c19c7f877266864c3d4cc7093a0eb72dd89501ebc87d8f +size 199058733 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..27be4f8ade92ea256f03b93a04542bab9e5149f4 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:42daff45818e69a95961d65af89e43273a7ac1a6fff511950ff88cbc00ae847f +size 199058733 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..044386e0e324d874369fa2f2109fe629d547ae2f --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:792fa05879db10f3fcbf2cb6cee88990012cd7cc01685e1a3d1504436c79a4a6 +size 199058733 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ceb2680bbc9dd964317584ccca3c0b16bd07c15c --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:673249f4df294e772051ba89bfebdb8ffb32cc4dcc327f8fa735810f77948b1d +size 199058658 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9567703602dcdd8e8cd6fd9690fe5c6c6ca0fb17 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d0cddb7365c2572378b6bc9090fbe36b91f67745837121307486ed0628769883 +size 199058658 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..872cc1f8ffb603cc4540d24491bd6418bcc51aad --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc3aa57d023c01400582960df5544a51cebb603c65bc10bba0cdd6b6236450fd +size 199058733 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..51a607dd346f93c2212c9847429717da06d0233a --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:24416c83c5564b906328a9fe616be3beae90e4b64db539bb23523ead02dcb8ea +size 199058733 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..363ccfa6af22fa73d9e61bec5ebccecc3a33f693 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:16ee4e475e20fdbcab9898c6cddc2d42eab98dd2dfda3ba96eeafac9be0dd7c1 +size 199058797 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2a7b839b5eb4be8915fac4ae1bb5947caf6c7190 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9f4b0615e967b61c929e0c4ddf5625b63b8aad5b23a47df9046498ed65bec1e +size 199058797 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6bd74b66747bd237cf641e42fa6f0844efeac2c7 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:29c07bb9b0db2257a19a0379aff6aa69ca50a5ef9609995cf55ffb425ad57b94 +size 199058605 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6627c0709269121c4c4aeeac5db402a6268fb7f5 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba2366e91ef3de0e6b434835a09a78ef3b21bf1d2a73192c898ba60171ebc16c +size 199058605 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c6b5f84e3dc15742d2f8e5169b6bd18b1ac4f629 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f9d843d16e2d3281a6aa47613f1eb307e48b2ecaa1f12a0655ec511a6baf4e5 +size 199058669 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c7e74a0cfd8ccb0b181a24487d1100f07a51c195 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f73e3637b534a638403e83f6eb5af89ae8ead30541fefff041c7d61d1587dc67 +size 199058669 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..da656d65daefecf4ddaefe3c89e4f9c22c14db03 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d8eef23e061ae79cf5b3d0f55a1b5b5ba830df89f16f4169949dc717b256430 +size 199058797 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d3509cef4e6531a361c3efae72eaa51041b7a127 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23cfc056aa12b972c4a13d58e96de0b86af785a449858906bda9d59279d7ceb2 +size 199058797 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d4cab1a473c27f524bbb8a3cb60cde8821462fd0 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d857acf329cac4379d0f4a633394668f3f10ae3e44b76cc77e986ba3c3dbf50c +size 199058733 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4dd2ddebfc2d6b5ddd2a1db9fe1572c091225edc --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c3d36166af220dd7c81a1d780ab245d1760962cb78f91f2a5b1bcfb2a6a194c +size 199058733 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..da0f8d8ea37b42627d75ba97f6c538ff6938a806 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4dcaf485b617caf738727bbb7aeee9db4f52f4292e2af10e901c5a3a0072f5d4 +size 199058733 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d505008a9fc0296ce6b4177f2be5e7171130d26e --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd12bcb4dcc57081f4d8014aa1e5c17a445e4d6f002fdb3d7a4264c6cc343043 +size 199058733 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..84d9e4e5dc8129f5c961511cdd5700409785f0ee --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aff65765c9b9c845aa0f6ba06525884d046dfe518859882884b5fe95b35334d8 +size 199058733 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..052c3eab02f3e03b2a26d0b78b48d5bbc20df2fa --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:81115c907ad773f8d946fd4bdbde4c1ac9e549cb156f7ce8318334ba3ea7c0fb +size 199058733 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2b21b3a4be41395ec79ee5f5c7c0ff81c6e40e9e --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b24dcaa3942c67398acc66dd6070bd07ef58cbfa5561cd339fc2f98b224c84c0 +size 199058797 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..462ea30e80b3bcf0f05f056a309093dc227faea4 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8113484ee9d86562078a2e20dcf224248e39e87c8536b0af843dbd964960e863 +size 199058797 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..033cbac511225d72cf68dcb7513d7bd45eff5ba8 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0cedb7587ec082c03f29010765ef7dcc29c913931306e522e127815c1ea15b88 +size 199058669 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c373dae6ad6d29c42003128a4fd65d829fc84cad --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab290f804c399a98916c92bdbc14d09a50a7330a9ac3fe01bfc4010e41e63425 +size 199058669 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..869a54eeabc93f7edf5407ef4c48cce8ba7ec108 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5bca3077232c1a9592f35f2c6f52bd9d4bd2ee02b0845b59ab34a5b3505010c +size 199058850 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d6f29e13564d51933ef1bd97f7adac292b298da1 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b5ea61f2b15b2ea2470f57fa1806788de99837ebb057c5db978bbf4c99021879 +size 199058850 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b2300cfef18a38f1fa8ea2bb01857a70f42e53bf --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9709cf103e8ef260eaa8e67124b022987a5fab8f2311406d0ea602bf5951af1 +size 199058669 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..da7feb49441b90829478276ff944e67e564ff33f --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e87e061b851c4e9cb55bcbf742f951dbfcb255e69a4bc68653383915ae68a89 +size 199058669 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..64af450662b9b3eeb50b16622e5948183119b284 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:60223758d8e7ffed7007c60d67ad6d2e6d9f7c08f6b9103010fb110445d0cf9e +size 199058797 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9c5a99045646d7208901bf750bc29841a2427c64 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f81a41d2fdd72d1dbaf6f70d2acf1032cbda99bf856145b6de85f137b9850712 +size 199058797 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5fc63d31d66765be99fdfeeece4987820b56b33d --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:653f4e06c83139c876e97e832a2518576ad3519493bf99e2b7dd1e1f4a25a3a8 +size 199058733 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a06ae639dd8f3b7cedd3a4d05f6365b6564524e6 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be10c5daba9784ed4f4e92551d40250c8ac2f336a90c36fbd12e5a8751acf4c6 +size 199058733 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4037cdc61f934dac9430701e89683e7b11a993ea --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c74b171f0be5eeda29d3e18fcdf6cb417326221d26b5655a49dddff6cbef49eb +size 199058733 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..165b63983a74cc7d820aa8ec31cb1b6df536f83b --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:553a800c2d0dbe633ea5a89ab47ea58c49fe9dc73519b31e166cf186d2c961da +size 199058733 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8337464e73b8e2cde373d185adf9def4217d6668 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2994519f7951a1cec4d6c6c06323910065dffb500bb62d20c2eb93e0e9abbc7f +size 199058669 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fb88ab9dd0db4afd42026173e48726352992a44e --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac0dc6c014b816a499aa01cc053efdaf304c727c108498126568210f641b208e +size 199058669 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..905ec7f311f173d4e147f123d153d4b7e396d589 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:41e79d3720962a73136df4ca3ffda62fa277110c078b3bde3eed8c88a0f1990d +size 199058925 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e6804468296b1115abac82d4e737158878266f20 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:324c6827c7e60516b4f71e6fcb2839dd88c2ad73ef86fd0f715ea99e94d27ab1 +size 199058925 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b63a81e5e6b8745b5982356cfefb18ebd372ffbd --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f022c0ff23fe586a94552e1ed519f5e36cd81d2d72b1770548b90af5b1d02bc +size 199058605 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..63ce8c7a4135ba21566657d593ade2c7d2201524 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c57da376f7728d774b2ac2df0dd52b38ccf326fae7e9fd2c31c4a11410ada515 +size 199058605 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ebc686e97874e3580635c2198fd8b12a15c52534 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6732467bbee0bd99bb33a98f1be3b28e2f06ce7f6aac4212d29363a4464d189d +size 199058605 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bf9040fa090246d03dc363387dbe200f976640be --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27be487cc6566fc4d2d9dcd0f23b47232a0509890aa956f3c1c038964d6b968d +size 199058605 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ab4b30a1630edaf42ef76a1c5ba494cb400b9256 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23cb30b397faccb5089d0bf11cccf6b741615d65117e32f7885adb332caf33df +size 199058722 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9b42ed4ccd49e79b17643a04ab8f43de2f4c3962 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab0e66ac2f473189bf09eabf8dc4c58fa5cf90722bd93df43cd998db995f1cff +size 199058722 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a5de249aed09454eaf99613b053234c1926d35f1 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb5bd46167dc7bd2fe862f4b085c1689e2c8e1e3dce8e3e7e0ac4a9b808155e0 +size 199058658 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6360ddd6455a420ecdf0aa8e402d553cecae5aa2 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4c4071da0fa4445844372611e09e478c672da3cc9f0aa49fc87290dc2bee815 +size 199058658 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d561e214727a386ad98e1bec0654e91c0265e6a3 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e25909336f9570b9235c22421e7fc4897d483ef4ab56b580c383ef4e658d41c +size 199058722 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4111503070f926c249888f798be856df48aad279 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:873b485ef1ad31eb04e54e470fd39c12dd916ec0fd61d2cf6d5dce0f7d07966b +size 199058722 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..09437dc0c8864ed8cd86a593a476c1954918ca50 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c35fa9bd2623b14b65e77e01d64db9defc123a2b81d8b5a09591bf5b84a31cf4 +size 199058658 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3f664c81806899f33ed065b868505a76c892f256 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:201539d7b79218739731404dd884a6606e409e380aced85523f87c205cb9e6eb +size 199058658 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..41bca594548a62796ce7d226dcb79bd7558979cd --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:caf26075bfc18eb65e01ebe1470bb2bf79fd521cf5b69288709a16010601afc5 +size 199058786 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4c0f002251741e1f6f50cd8c7f67df59ed337590 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7a86af65305409377f845215d814d89360e92ae909f1cb968e13b8cc9961bbb +size 199058786 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cdec70a66b1907c11e1faea8a73e4b52aa5a27a3 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:30cb53a23681af21dc69e039204002e24f9a5b9ce63beef56f624bcd4d0b806a +size 199058658 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bf1a22dcc42fcddb63d872b384e23d3fa90c79f9 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d5a1a6bf0cd6e50a0e22d6d927753229b0c0ffae6b7ce0186d4b22f3710a0a3d +size 199058658 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..807d1216d1e6997c2a18df864f81b8698fe62888 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f571698c2ac335031c6c6d33cbbc3d89b8df2e7073685f1844ddfd1135dd9dd +size 199058978 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..20e64356d60867e2abf4f4f993495bb0d09da1f0 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:419e3359176886d80e1c7a2c1db9bd9122ae21d0fd5acd03d6bcda8d7051f417 +size 199058978 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..08af9815a4a9d91f041634184126abd2a1b6359c --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:771a8d9573ac33d78c2cf6e644aa2d36b5e4bc20656438044a216032af8e1624 +size 199058658 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8ec67337df8fac03ed4699d9022bb4dae3e7b2b2 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba84fda5eabfce4e52b4b6916ca477736029664dd7a879738bbd7abed29a2bf8 +size 199058658 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3c6078d6a18edac8ad03e9493dd1bcf688ff40fc --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e4f0d98708b33b772ff37e8b29b03a137f740759550f348e6fe7287e06b9e37d +size 199058647 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cf6cb3e2a6f3fa421894de9215f56250ecdcdd2c --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f5162a181cb5db2083b231c73747820f982649ba909f01dba98b03d00154aade +size 199058647 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4dca5aada078128432e2ce1ce84adf9c01737014 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0351cdfe249500746f887c53ec33abd72df28ed7c47ab5915352113868db346e +size 199058658 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..be30a89f14d880b88ad00c6acdfda2c6a8a4dbfb --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f5941eeec6539198bb33a15388c84ddaa43ad9dd599ce6ddc6628b5cea5658d0 +size 199058658 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0c3ea8b79314bbb3e00cc896871a8b3fd3309af2 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2828e81d0353cd9647a2740ed536c61bbd8074801bc7a902c8b96e89db019229 +size 199058722 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6008bac58af2d7b97068234a886bf5a5aa21f5ab --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d0a8c55a10e5613c7cf5dfc838990f9cb03e1bd01a94a730b78fcd686d861d35 +size 199058722 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1d790fc2125036310d76d0b9d15e6aa53b711365 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b1ad167ed085f5665fa658aeea8eeb4f9d2fa2ee05bdba77444f1f59c458954 +size 199058658 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5c4f4ac0463eeac35fda4da90134fa3c376a47f6 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:07f6fee3795d8b29dc7c8072da56a62c1e575933f64f1c0ca1929866441f9737 +size 199058658 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9d3998f5b9f4fd8fb6ec3df31122c2e69c0130ac --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:432e6d8b83deb4a9fdce4d5f4a229882023d133cb670b5626030c968180d5428 +size 199058786 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..84abf527bb56cee215219e48b059b80906044cdd --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51c24987bf6954df6bd53e7625e9cfca180c2739793d4670eed59c903dd330ef +size 199058786 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..50727d1eda8508b28d8005e2fa81ae0bfbfef5a1 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e531a5bc4a32590799ee34c3a25b80e62ce74d97c7212629613789d9712cee27 +size 199058722 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2c066619ff2df3f30853dd316bc1f391c23b2026 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:077ee8ea806b4c891e7231d41675117ff4ef3099d8f6a7b66dd1ddbc24aa2af6 +size 199058722 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2a470c931ce1c3b75fb0a216e233808ae0cd7508 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e540a8a9ef3ec6663185b804cdcada0c55497c5ffcc9437b274eb0ba5d09488 +size 199058850 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..03867f4e4a5a6859a27f7bb59fc53a539299991a --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6cd2848783045f43e56802d2ca9ec53a9df67ee43a81aacd83b12fe554953ee9 +size 199058850 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..22868e5dcf432bdb43098a007c91f3990053cdee --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:42b1251661c3337537ef08b3ae588a0fca8f72682d0cc157506ae7a648cfcb72 +size 199058722 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0ae0d2105dc0208f598a2ecc77ffe649da9f0a31 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:78c28e00df682e13311dcad40107bbd9ce61c48ed283a3bbdd23753f9cfc7f4a +size 199058722 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..18bfd83f419dca96205e9355fdcc097760f33c18 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eeaa985769fecb946c1824a61b73f87b26aadd52934bc74d2830e9917781dfe8 +size 199058722 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2f6c95b9aebb6070d052f4ac6e3591cb40bb47e1 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b5eb17217e0cdc672190a40ff251656abab9e50879e76d18233e3ac2afa0807 +size 199058722 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..924306597f7a96d9873317660575f667fa508a8f --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3db9b0dd93fd47f5b6a817402487e22dc3965e30b645a4470f80dec1dc18107f +size 199058594 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2f9c16872cd8b5b270e5cf3a801cf0edc1ff772c --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b89abf468bfe3f84b7ac07337a7328d2f9a5daaa1d104f14df053a1037e2667 +size 199058594 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..27120439378c1d2c25f4800102baba8a398bdff9 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a34f7bdad912098ddb61358a9c7b6b0c1cf5e2bdeca0e729d39d1b4b7f3fce10 +size 199058786 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1c4fe38a03daa785da1288d655d9050be1e79203 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84e343a7f49f0b8c085569367e1215a66abd6140336f3287af5c188359e87da9 +size 199058786 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b0594cfadf53e1c547037b39be37a189018786cd --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f5d0b447ce0b67c3463bf3d76bbd0a4a28f055163eae4f9ed9929e5d429374c +size 199058711 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2cd48360bbf15f4311eb265834e8b7fbf56052fc --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:38ba10dc15c30f9172ffc2e5a1748c76c1672599f90b743a85594c7f8751b753 +size 199058711 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dd17dc92f6caf9305094d3456e228cd4b3e66660 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ada46473e6e23059d9500dfc183915f649b8f3261b69bd36d9e8966fe42872fa +size 199058722 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..315a946bfcb16052db7a451917924c865a2f3c09 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c704eeb741c2eb04e5d6c9b3e30ce3bc9b9f045a44cb3a335414e0eca62e927 +size 199058722 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..915cde046ae0e1777af711598874a426db61e744 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b985e2c491f416cc0606d37f06227b33e4605450d72e1c58231a4ec9da347f52 +size 199058722 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f091f3aa093b1029590eb686502ca144c31248ab --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d12a28c5b915a87072188f1f8bc2a903cca3291492c8398c54c38860ab31156 +size 199058722 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..46ae214887e581bf53357f194d0600fa6938c06a --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed04e1ae3e9daeb08053795aacaa5bfe837cae2af84ab2a097ecc406320cffa9 +size 199058722 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d2c6dd63b4b517db2d6c2df58ddd226ea54bded9 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9120b183c1196ac9ee55cebf1e025b85800e0b7ec82a0f3286034f77785bb6d6 +size 199058722 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..26dcc9198ca94acf001733eabb038182da712fa4 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e8c23cc85c806b1c203b5fd38fc384302e243c461a9eab9e062931230573a1d +size 199058722 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b0df327c19658d3a41b8e85c924421f361d67a4d --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c087b6dd7f4cf18b87b1566b52b76b76fa70c1652c2e03a9c870bb0f37a41f9 +size 199058722 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..813f23b151fb060a277ac16ac5c58e8a39e68719 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:55f29d34bb117ad1588d7ee8e6e495fe7587718ab49db93dddf287e91e1e1363 +size 199058722 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..571e2a11d59015557bc1505ec3af07cad11d8a91 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:191352a8d3bf1535e377a54b90be0afcb26b83037b11328603fd06159f38bf46 +size 199058722 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f78986357cccac86e32de6fcc21358ae52f7bbd2 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea9c7a756ba28061dd6798a4102e5963cda05d68314b333e8aed11169432b71c +size 199058594 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..78499b22422935500f345fe262629579531a78be --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a6dcf3d8aa47b8e748bd2f7035fc5f3ce47ca4e9a1701a037fc903aa0e73575 +size 199058594 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c5522b60f2d99080fe91246c1bfe4e2688c42cff --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3b85aaceb9ddf160ba0cdd76a0a11588eeba10532f83995a62dc50164ffa539 +size 199058722 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dc0a6dad005ff5eb58e65d6704d5d084c045f9fe --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:70605f64e416f579b160bf23d1f9edf6659a2dfa6f9b1035a96a695b4d16cf15 +size 199058722 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fa23171d50131c61926221c4d651c32178db4f77 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:720762b683eda9fa0c9095e3ea40ca170730fb13724b414377fd0d2ca4f45c43 +size 199058786 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dfd48bd967c69ef0f5bea2841efea94225f62fa5 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6fe34411b9f562ed699cee18ed6104bd5a303b88579efdbea1fd485663f91d77 +size 199058786 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7c8b3c9fa78d75c60a06d965e4fa6ec828ff06c8 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f8ad5af6e1975dc6c78cf31c1bc9eb992d746f5407d6070058cb666e24bbab0 +size 199058850 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..51703f5ced63e0def75cc0a717d74efc8219a70c --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3025c3c9bdfcae67d9ec2ef403442d7427838d8c1485e374308df52ba4affe6b +size 199058850 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3cc2e50e6282bf70193d4e2b269a4969a399c1a8 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4dd403d99da2c78e384a60a6c295207198299914516486696e7287546d51d8c0 +size 199058658 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c0c2d18aeeecd2eef544371d4399264f8de2613d --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae8d9bd9064272f08ec1be3a0a6570ec5d3a70afd5c5562b5c7d1a3424fde9dd +size 199058658 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2b93767328ee41e48e39911fa8f705e22fc48dfa --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35ad364ba394d3ed9399f55e6a82baeb2dea0b9552c177577f2d1b214d25256f +size 199058647 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7827af92ec4b24cb45355b42a8d701b7aa63f2d9 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:833e24851adea5a92fb5dcde2c7d0f68310de6ed5dae094f93d81fb5721e707e +size 199058647 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..34dc7128899fdab3c64eaa8810d203c6eab0a93c --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76527b482eda732eff2a690b9ce36a75220484b08a929b3a9ce90239a105c598 +size 199058722 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3ea3e3e43fb9a865fc60f038b6a17cf262402cab --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bdebf8880737b5f3f96d55d96bff48c90a6683a46fb2df75d55e974ba10f0acf +size 199058722 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0b34407e6bba3d51631a420890ac9a7760a3600a --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10cfadd7e914f4caed0125a86e4476b838cf051a1aabdbcb0b0ffc30580f7fc2 +size 199058658 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b52a9384bdbb102ebfa361f5a197285bf1218e67 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4d10f58dd4de1897eaaa66a65bd025cb46978739c45db1da5a970b7f0b82d8a +size 199058658 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bccf965e8035f39e83a832e7104fc7bd35cf4557 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:99610f7065771e154851bd864d8664fe5d6ff02e65b0f61d25cd17993a3b0795 +size 199058658 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9027a57ae8461f34a1042fe03a701e29b6acdc62 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7049a469cd34c117e4c709d09486574d2c7b5753a1f426838d57831c02ece719 +size 199058658 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..76a03d68bd8e67ae0d551fcf2debe34fdeddd429 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:89ed44d4eb1f2e1ee470c3a6ef21398d7cad9321e0aa168fcd2a923e794f566f +size 199058722 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d2d9f8315db7e149d4a5d9c2cea74a2ee3c78785 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d619c8aeb12cc59bfd96e4b8867ea37016668d953506624dc11d16a2cf181c60 +size 199058722 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c7081d1f6deef67492f0a0cf121c05bb3192aedf --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5aaf50517855f95c2e249e35a17586c65acfe6dd82f0d852f74dbe71a06511c4 +size 199058850 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..eda3f00a4a02f47f464545aced598921ac61b399 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d38a3b9b4b87f57d7f2f700b528b0a3af0f80f549dfd6cda7c24d38c3ea2d534 +size 199058850 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a265e76153b58f8c45911dd3fe0c287881ea7e5b --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b4c7cd9291570747c8f944c42b87c290f16f12fc7067ec4714f640eed4977073 +size 199058722 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..575c30ec1acef4ff71eef663d21e7fc7badaa52c --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:59d0c1d4a767cdca47a400d898f35478e29b861e775d5277457ce1a8992cca8a +size 199058722 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9c0e4089ae2844638cdfe07447a0de6162348dbb --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:896ac45ae8be17f75127c4b9656f694695b819f31493f00f992f74245eae057c +size 199058658 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1d0cd78c8b8db208511722147126e649b640686b --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:360ce7b9d44cc92e311aee452df3b7abf3e2eccd6111eaae18b4ee0df4d48644 +size 199058658 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ec7a1a22f08ce7a1d50b45f85a403cbb76f2ea57 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb67e4a351cb565928643e5e6291f3c4df53f2de10d03e9488b7fb9940565060 +size 199058722 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1f49fc642265264088ec2afe67900109f14f0305 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:507e78e34a5ef81fbade560c42ea5977a377dc504873e410ba85bc8ea4e4a48f +size 199058722 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..19d6e666b03571509c0a3ee38e7cb664c2748ace --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6be86227f9c1cea563d321aad4e16240bd8b34d2eecbd5c5b18d1ac251f614c2 +size 199058658 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6c76b46b4eb3cc81b7557c220edc8fd9c4a16c34 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c195ce48e921c52c9cc8d0b8fbf730938889b0d5283a980c467453211dd67b31 +size 199058658 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7cb05695e20846828fc2edcad960614244ad7bd5 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cbc853b1c90dc88030a98a8e662b282e84648ad9b754aa860487875c7548e0fa +size 199058658 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4c8b47d02003250721dd14ff85941964ffed5b81 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd1c832610564ea0ffd6c5eda879600c12ee547054db5ce7584ad33b043d2d49 +size 199058658 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a1648843d96177190e93d810ad2d8deeed619dfc --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:257fcb72124a8c8fa9d740d2a90ed35c48d10099034ece9a95aec6048857b5ba +size 199058775 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3d3bcc5d332ce667d2d246f25d86f85dcb7de2ef --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb00711f602966120c1be1068e8df998271fb223d3b16f97ec1fb496db268e9c +size 199058775 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e18a683cb4d225788e11dbb9adb42ca0d83b2d35 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb512767c29beec5fd911b10100c9446172ea6ff3c4fda893d3d8e3006040089 +size 199058722 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..84f495e08a0c21536a7eb5d8a08c0d9d74f24e0e --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:583260ecc649ca0df3f14a0d4a425f60cb1b5f598c6882710948d9f91564a22f +size 199058722 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3c1b8e542474c46ca568a483881f8c56cc7a1f5e --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b14d81c0f45866676041eec99ef5ef42ea555b72a9a7a1bc9281eaf1a8db5b0 +size 199058850 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8c8171882c8db1395d3623302522c032c4567441 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:738d95dde44ccb37cc3a9212584378e38c9259d9a37e012c24ba4bbd95a11362 +size 199058850 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7bb20c2d2e8b03391f98a4d3981f300f982b6b56 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:18e6472381706447b685ab57d5ae19e1cba18472b206cf95a4c6a739a82ab193 +size 199058722 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..185e841aa684798eaab87b114ac4e8f848fe5fc1 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d622c08d6653f598ef5bcadbe9d41684e24ce5b3531522b47b0f5c1706229480 +size 199058722 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cc5d174a3d72eb952d299ecb447148d8431b72fd --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f8feff94dd7c96db986b288a345cc9838e85ff79a01dbd725e874db5d5db49c +size 199058722 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f8bccc223b95157907b976a2389aef91e3062edf --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a4da324064779b92027f1486353705752a7da5f85c59a7893885b137f1246183 +size 199058722 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..89157b6c31bbb7da5cb5fb4877ed104008360e2d --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0776ad50af58246cbda880f33352dafecb356446be24c00af3064ac950b20b59 +size 199058722 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8a09e4d392e7edb116ed0a96c2ae0467c9f62863 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5dd94f316a5233557f849d35b7eb52692309a034c99146ea7e640656b8fd0959 +size 199058722 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2984c0ff0ca7ee422eeaec096cb9fcb2a3415d4b --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9579fd53501758f51a33c35a36474d2088d709714dd2c1cd92dee79238d63521 +size 199058658 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..be831485986f7c67cb49445a555ebd22c2b1f5c0 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c9134fd7657bb4bcac2fe0e8c37f47ed6b44a7a1c0ae57fceb2fa49fe4911c33 +size 199058658 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1a068b828509a73056ae630e7e164ad6ad6b1eae --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d4e90f26933216a8b3b06ca23e12359a32cc311f5b1f1b0101891b3063da6b2 +size 199058722 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5c7c40a84097a40cd4c32c625ebf7b5d62914053 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:436dd2ae26edfe1f4073e5e96584c07496f04c94fe3762df09052676b43df812 +size 199058722 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bca05b60632f36a68d69b1952209486d563ec223 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2fd08714201c92ae1fae241442e4be9062efaa1db468f10e3425e49bbad32427 +size 199058658 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4367a15c530f5c712aea2a94e160bbb62204a940 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7109955a35f94d15c4e66e8482f6d292dc354fd6722bf6de1463332e84d1a06c +size 199058658 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..510450f1cde6d450650f7b1b548fbf1d2dd502c1 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9532452cfa50eef53815e52bc438945c757b56782197aea4d93247f8b615ba4 +size 199058914 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..182e086934f8513476f64f51de9c48303a9f80d3 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9bad42e5ce217cd177c20c595932d7f5bd39d8f36c1dbbc9b67b8e5bc25a6220 +size 199058914 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ee2ba7d4481f34874e824556c720521e467ef525 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a36584ebc8c06eda7fdb2cfae87ee868d6ef3c41c81109e3e4f3396f6f7b5f94 +size 199058658 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4ed5a0c44600292b7dd4634a1a62447bec073253 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2893311af9d16de8890c0d67f29425cbb1457e9d12ca379927100dbd7c0ce250 +size 199058658 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0d8b29495d115613dea08536f416bf46a7a677a3 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b477f7d52db1e29f87b0ad3e68a47dd1d8644eb6dc2774c045cf1ce5c433e08 +size 199058711 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..57d994860bfc9a17f707bbb341d93f95d7cf0c7b --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c79c57f0dae764c93ff3a8bb36401f95800ccb42e1d38623dc9a78471fd3feb7 +size 199058711 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cc3b9cc5567d29e164530b999dccccfe7a0575b1 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e90219efa6d1e397ffab54b19c96792a2462b8dd21fba1644b8586a87fa29b6 +size 199058722 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..89b29adf9bf3242a9fa4e53c11bd13df19dd7ee1 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:102ed150128c626cd533a4761a20bedab7539c1953f0caff6d9701966e063b5f +size 199058722 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2a863292b8fb003477e9792991de8e2f78f11ed6 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:83167a8e6499b37d8f3beb91a749efb71aa54a80aa1ebf22c42d5f38a5bcf8c5 +size 199058722 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d898aa3e8f2bbc25a968faa6dbeebc6b6d3b2347 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1300299e13ebafe1e1c5031d4d17a97fee17dbd827c3a575d922792d790fcf51 +size 199058722 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7372381ab970ba36496c8c3a6aeeec073a9e722a --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7347981837cd200308b0297e769f181309e6a8c81fa2a4dac0bc93020f8386c5 +size 199058722 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0c44e4c747791a7e662a13b26edaf2758b0e44c0 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f851d2fb5911e2581e9b1cda86feb5b3592df1346acd40174562c8bd6b38b47 +size 199058722 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..54d90d593c9b2117fc782527899ae9f1982c80ca --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a06f90e988689e43fa05b28c854ee40cf202aed59bdad0dd3a328b3e8a29bae +size 199058658 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1123d3b52a56ef46b75f971f561215724faa2a30 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1362c512de0015d75c6176f9c03864b3bb9a51b22b3f0748f419a692d0ae9b9d +size 199058658 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..346b6e90011a891d4d977736fbf349ad9ede0b6c --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8b70ae39b682c87f9a2b134358c9ead4ab242ca36f2404ca7cd07e9bc6c5d64 +size 199058658 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e6ec3509f43082c00b42741bca5532da5c071924 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5bbbbf3def41d7e32a65f3ac64915583eebf1d70c441e8dfd6ffe730e1b607bb +size 199058658 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f9289ce50ae51c29d7f94bfa8fefc2eb567087d7 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c2e5f90d723b7f8ca77e936d9cc1056aca8f59e376357d65898f93e3ca0a620 +size 199058850 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d645731f4b8873d64fd16595cdb1a3e51be88728 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ccd3db8ac7e68ab19666b19f96d4f888812edad88e76ceacbb6e6ccca7cc51c0 +size 199058850 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..88665ab75b05d7e966729886943f985557db570a --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:07f707758b6aaecfd0007caa9024f6ef80c9e336cc7de3958f63768f565ff19f +size 199058722 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..576ef122883b63a342b48af907afc757313ddb5a --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:67d59d9ee3aad49850970e4097656cd2d12915fc6aa399fbb6e08d353e26548c +size 199058722 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..154499d30ecbfb81cb1e54ebc0a4866501a16720 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e0ad7fa3e02a52764f5de6f711be8364cf3b6cf2b4c50903b3e78903073fb34e +size 199058786 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2f384c71da3375e0a39714f5b0dee9d27b021bb5 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f182cb06125193524f78ad821146baa958f8aaf9a2103f773e27ae9241bb8341 +size 199058786 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..020de41e738f93b888a1e23a1f8a9f7e0242c5c7 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:18a11f5a35e93afd72e3bfa36ce3f7b3d13da2d047d45e19df69af9e1db7138c +size 199058658 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e9fdc8402f6bd7cfedf26298f53cf3a4a04decec --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:68e5f0fe6b4c7a98f5ae2144606e65bfef77ebc44454ed173000002c5635a791 +size 199058658 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..18636b0046b731c9c350e16320e39c7352dd30df --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:54d45d9827305a85328c2503a3534a87d59b70f9c205688ae326dc1013ce2c33 +size 199058722 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..67950dbe51c20ac98c1e6dd27033065cefcdc000 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:18400d8154f3aa315da55b450b167e44c25d6fb521a9d8077e133dc23fbe105c +size 199058722 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..245e08c879ec80fb4f318dfc1b4fd7b293fa2b48 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:37f03ebe22fb7f49c75b3ff3e5197d2cbd598c044f112d45d785cdbce1e6538d +size 199058647 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0d3798dec542feeaac928fc62119ae0b06bedd8f --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02dcab4deaf130f35f914ae30996a023f7290d9274f74e144dc67883b308c1c4 +size 199058647 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..51dddb1a9ad1d991659731c9359ccb6f7c3a4312 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d804433c2abffa1f958471224909b11bd0c68d6d20414806db452ce38ed082c5 +size 199058658 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0e4724b66cbb88616e5e9abc246e150d598b1b10 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e29fd594e9cbdf519a2a1d13ce0a55435847a280b3d74a8ef5677cbe00535d0 +size 199058658 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1932514ea2e6afe338adec2142efbfa7ee243aa8 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:523c9b6697311648180cf65f0e25f1e137aa954303cb6d1415d4b08369979e06 +size 199058722 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9ef811e0f0052abefbaa98092ee134b5a22da6a3 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:605cbb0ac38fa221085ee33080e88266084397dae4cb5ca91a1e75dcacda08a0 +size 199058722 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..791d79d505c953710164d39167491fb98fad55e6 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a51d5f556934c52b97541ee111697ace290f52c95d38edea917ab690f4b0a5b +size 199058786 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..33e24acb054c619709f1e9b7885e8e947dcddaac --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c5dcf8dac75eeebfbec6eb552883d0fe487c52df51d6e2f767cfb6b402e5190 +size 199058786 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8b029d3aeff90fcadec4978006191dc57187df44 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c17eb0c4a0c415e861b658e65d41f0adbf4171ccbf90a495dba10604a758678a +size 199058722 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..12a8c6f362d187779f18bcd68c93595d64b19767 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:319b449fb6dbb7635719ace5dc8e0c08accce15a5910a007ddc65f6349e6ee4e +size 199058722 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f602e92d57120caa6e563109baf4a88e67c1148f --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f1ceb7cc0db438f6cc2461d7201129e2d935c0942c4d6e77aaf40dca9d0b0d0f +size 199058786 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..edbae5b63f2e49a52256925443757f290aa5fe39 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f239c43194c2abe19ffe869e4e0117324f1b534a406e947ab7cdae0f81749503 +size 199058786 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a3f919493145fb2f6aca813dfa3a1e5545c25e1b --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca0bc1c70e66829ff9c8c061e01fb8b2f67d40fb4b35cb31a25a95ee6d48f107 +size 199058658 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..66caaf5cfb36a5a097e97934a7cddbe67316f210 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:56b8e0fe70bc019c5dfa2d1796e313029df6604e176111ad5e9005d05640f67e +size 199058658 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8205495e730eebe040d57a30471cbbe337e4e33d --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb3683c3286c0432364dafa0d7c9dc1ad0b8d402c16e438f901963df603ef668 +size 199058786 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2a33717691e6e97c5931b24e2cb558628448368c --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:83fa2dc7eabb6593209b281d1bef2e817c31ff17913daa18e6daa82dae8cb15b +size 199058786 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1041e3820c2fb1ed2d7c2ddfc891c1772cd67f7b --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad25968ae89721443757352011fbb8b06af1f1c7c6600d1e56bd619ecb89cf33 +size 199058658 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a28c8bb0ed8470d3e11533644d9188aa44088459 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f9fd709756e326b121cd08927b79c3cd6b87c51c79f43197fc3bfd97537891b +size 199058658 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6ea9a7b054fe6dff2329fae24e232eb9958d06fd --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7fe580c3959a70628e7c57441bf3fcac7cd107c951f2be6cf309fb7972dc7a28 +size 199058786 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..721523bb1d503dc7845508f74d7d1085502ee1fa --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c42a9cec01da50cea6b4f0b83f671359ebd77836d02a687d5d38a0d184146e0b +size 199058786 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..71810b0f5679179298e738839d091fff0e343eb8 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4cde85ed66c2ca6171cf3dd3a1957245143832b70cd8439a476ea90694086afc +size 199058786 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..09622f26f3534bf2d426db09360c15b80c533fcf --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb5ef207793c361003e3ab245e286b9be05f36a578319e08302d2b1ab2cd65d2 +size 199058786 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..925ea2b2b1e546f2a5b7b71b99a069db470768b6 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:01af011443b9bfb785ec3a647c099768d6c8c52eae542862984790240a12d471 +size 199058647 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..79a07bb757ac85350a79f8183e513870a0b72c14 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3047114c7f0bb920ee6891daa0462238956e6285a73194215a9edd77eda6fab7 +size 199058647 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..785be2db6ec8862d429edbcf5866779e2fe17ecb --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b4004fb732fef02f473209f69810d55015d67a19734808f3b7a83281e952049 +size 199058722 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ffd0e97969e79e2e5d51bb9e48d2161eab55d12b --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a083b51488c20b3ca6feba8ffe864d7da6030b930a7d29da4e41cb5296a72e2f +size 199058722 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4b3e2524e4cd4b7403446d456edbfc94058c2b9a --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:501147ab20060a91543f919b72a59089c8eea0e3a3cbfa5447c945e1274291f9 +size 199058722 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8a28dc424af71ec2321051af0b7aec3de1ccd318 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8dc4bda3833a54fa76c13ace72006a49774edf5d15fe061a9b15686bbb1a8cd1 +size 199058722 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2b138ae822b9e3eaa7e479262ef3e44a30e8ef5b --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e04f20214419199c9ec5ea24429ac11e29319e0fcf6961211b9b09bd46595959 +size 199058658 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..776951a578bd1857a5fefcece7a156010ed9ad7a --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9b7b68b14855886a3169d576f8e34730b86d62de12c90aed66c40f0b0ef0797 +size 199058658 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1c3b8c3a0ba595031fcca40cab044c9e7f1c3e56 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c2f2a16f242a16105505480839c9700e22b97c6c1d433928a9a0acf62496c741 +size 199058786 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dd80aa4a68f7ea9ebf46dcbb9d39cb8cb93cd34d --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6427e13531dd6f00353497795887faa4b0cfb048042abec8dadbb7a86c7db2ee +size 199058786 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d608be595d67a6630351609aa1fdbbd7721483a0 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec6008fbd4b1ccf2709fcef775dc8ba47d129bdb9a26600cc91c381ac6678f6f +size 199058658 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..eb4fa9b55df7cd8437c9753907b392fa6e147466 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da2b0268e26e6f6d3bb4eb24b0a9c319918314bcbf66dd944205ca03a3ebcd1e +size 199058658 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e7ab7b09f3271452a1c389c9d1eb958081f4b721 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:54a311ad910b517cea756cbe52e44ece296928e8477aa55454cfd62e8938b7ac +size 199058786 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..360fa5d27517f1cf3c6f2d3481675fb7cfd6d15b --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3962cb1cc0adb027e265e289489abc808626d08dbca11ead5d686b1a64d3761f +size 199058786 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d1659c023462ca7afe06c6224d2bea586f50324d --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7fe477c74f0f751e92baba6016390b0fd64604dd5904b62a2252bd2a870e2df8 +size 199058786 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..17abfba4cf17325b968490bc8623878c41b20b7c --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b789dc987ab76068007f0dbab9f1dee518716fd04d26905fc63e9f2d1f0bff3f +size 199058786 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6241a7b5cb066a95bcf481bc528fc1e34eb67ede --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1bca84730b5680462c0e93c424abb17891a790e9abf96a459454156121c2e96a +size 199058722 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..db2996f9a2c5c2ba0c2d29ed324c79e244750dbe --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e1ba93fedc95b95049720cc80e44b7d7e65e1219ba91d2db68d0444a552d831 +size 199058722 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3258305e5bb2f8b7f288fa856a8c3cd41fbc1fb0 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba434f15a8c87261f9b30166ccc1757611f71b5db1af310c8a975dd3ff34400a +size 199058658 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f167b6091fb9491f17fb32c3eee3b07c0fe9d6c8 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77ed66a69e7ca122dfdef72d68dbe9c4dd64b29d92d4a64d1f13363bf31376a1 +size 199058658 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4b7b7bea8929e187f635dcfb69bb0c7836cf6933 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:888ca6dc50dd97ee98350f4da6bc9bf0f2308a5436157a87f5edfc80e41f55e2 +size 199058658 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ef172a52b986352a0ce428bcc52de71b1768e5f3 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac4157d98237dece9fddc605c8f46e94d0223cbac77e7f9b21a2895802fe0416 +size 199058658 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e716342eac34a380ac9827e7f580bdb465159d07 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e4e5ab5ebfc3d1f2c31a2a2eb083abfe7077da9e4e14b2c07d81c3aebdf46b81 +size 199058647 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..aff517a00586b1b49c08d499c3539fc64a979188 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f40a2c609abe3757eac1a9d46cfe7d2e3c1c366d270180edf2d808cea397677 +size 199058647 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c0393cf2b8c5fdf69a40ccfe9fb99dbe64580da9 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b8f4f6c55a3ec6743d6b0a215f6bb377cf320aee0af92da654ca21a5e6f745e +size 199058850 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cb0197f8cea850feefd8ffdd6175a3167d31d381 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:790447a4a6c892f71d84064523a7ae763d934ce4accc7121b403843027cdbc79 +size 199058850 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..71bbc987c8e7e4d0a4f2beba8c13177fb725b374 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90e1ce3d937ae28a8c7fd8fd2c9b3987302a0118a3391462016f20aeee788c8b +size 199058722 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..30afcd761919219a2d707dde1d4aa1b1f2c5b8f5 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:18887917c276c102ac0311f746a08c67bef81dac2582e702d8c18263f62be1c1 +size 199058722 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bcf16d4fdc8394cda4f44c66d599d6b88efa3e92 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e1470dc3be15a098aa9dc040e422395cd761d0fdf487469dcf1f4dbdcdb6d0aa +size 199058658 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f1a09256c1a683712f3721ec3cdaea361617020f --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c077fce58338790e505acf2f919f8a91830cb6424729efce7d7ddce3fb6044a6 +size 199058658 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e51aed775c05d3f7a01182da1e327524e97b13e8 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:325f26f13a83f8fb1e7d7ef4717b88650e18bdac3bc6c5cada94c17ba2461c6f +size 199058786 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..59e6abf4d7258d66989bd35449d0477a6bed2aa9 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a1c3920121e96d2b20f9cf974e1c05b288a0b411f2980fa20eecb66a38aa1f90 +size 199058786 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7c2063d22b3416a46857d8c7381b74f61c18727d --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:395fe869685122c0464ff8b96ede0123e639a29a0ae4fb61e8fb95be30009b3c +size 199058722 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2b9c126df654f7aeec736010106fb3cdbc9e57b2 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:19e9ba934efbe2bf4a2b1e41c9f8f275d5f5a317bff237ff01cfcfdb1570a7cd +size 199058722 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7b29ec98020c40a70f98434896c23943f60ed30c --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a19c48df48d594b9d210c7a4fc02198f1a5a7ca3240fe24df2b08de945dbc3d7 +size 199058722 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4403bdb330b48682d4c5ca4525c1c68ac15e5654 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8fb2eaae606d06d19cb50e474a7385a95d1f91e3555e18e770bfc5b3161dfc60 +size 199058722 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e38b2d836832fd714d946152d32593319a71681b --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10f26192a793d6d2b92ad72133cbc3aefff2cc510ef832aaec9576d4e71d51a2 +size 199058722 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..23c85a5af21ea0c1f939ed80a3935c7dec1834e0 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c84ef3240db414f6e4f7adcd95172bfa79029ba4bbad3fb4f739882eb9873323 +size 199058722 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..47aa108556b376d412cd47be4d926c3bdd6063af --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5680ccd116bffdf21e181a118164dcf9d86038ef5b5d77cbcb3153c47b5888d4 +size 199058786 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4e851a0c66e3c67d222b6b8af9b9198e0e733b35 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:faf5a943195cbf017b8617f6a71958aa62ed5998857877a2e0fb0cb380aa3522 +size 199058786 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ab3c09e80bd50f69868bc22ceada810edfc0bea8 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cbeb5438f70aa723d8e2950ae0ca9c5d0c0c0ed80540e79508b57e8ca98c2288 +size 199058658 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3bb7841d890062da4d298797bbd584d990d20b1b --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f06fad235d608e967ee601a2305817661082663329833c231cb11e04138d082 +size 199058658 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..79df0111d4f20b79ac8aec7445e032ce0f3ab9e8 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b08a73b31ee765eb6e72e07abe1f1240e0e595a4b9b271f09de5fa2d596442d +size 199058658 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..58af0546a0aba658cfdfa2a8e4b152065bb2dec8 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0036162affedc4d3653fa4dd39920a331170833705d08aac57de4dc9e82d01d3 +size 199058658 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9b807f246970b53592a3be27c05aeeec2c4792bc --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ba0033642fe2b1c4c86f5b93ec431059c41a60254fb9c9bd975247e337f2936 +size 199058839 diff --git a/4b284b6boscar/global_step80108/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4a1950b6e39a2c1c20428db7ddbcb433eaa8dea8 --- /dev/null +++ b/4b284b6boscar/global_step80108/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:17793ea8af71c5f59c887954dd939478091bc1bb45d44bd3ceb0fcef2f23cf0e +size 199058839 diff --git a/4b284b6boscar/global_step80108/layer_01-model_00-model_states.pt b/4b284b6boscar/global_step80108/layer_01-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d91c0f9766870ef896d6e909cbe297703f218574 --- /dev/null +++ b/4b284b6boscar/global_step80108/layer_01-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ddf235813ac01a4f66e75e998014efe0dbb90ffab4db96224df76fc25f87919 +size 167511299 diff --git a/4b284b6boscar/global_step80108/layer_01-model_01-model_states.pt b/4b284b6boscar/global_step80108/layer_01-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..825a44ffa0db163cbf8348d84990d7ebc5cc86e8 --- /dev/null +++ b/4b284b6boscar/global_step80108/layer_01-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20f89287686ac5b1bb76e2d30cbb5397e6f02576f83211fc842290b6a1211ad1 +size 167511299 diff --git a/4b284b6boscar/global_step80108/layer_03-model_00-model_states.pt b/4b284b6boscar/global_step80108/layer_03-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4b5fb2b3ba52ac9daf609348153aaf27271ec237 --- /dev/null +++ b/4b284b6boscar/global_step80108/layer_03-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f5a83a1d3977ab4ed34b4f9f81fac75e65015dfb73fd0a8fc712c6d64e22d776 +size 113308931 diff --git a/4b284b6boscar/global_step80108/layer_03-model_01-model_states.pt b/4b284b6boscar/global_step80108/layer_03-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9ec182496c7e93415daf2a5adb2b3d4ce5de9fcc --- /dev/null +++ b/4b284b6boscar/global_step80108/layer_03-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a217d4c87aaefc35710a401a3c17102566674247dc6ada81f4b7d41df054687 +size 113308931 diff --git a/4b284b6boscar/global_step80108/layer_04-model_00-model_states.pt b/4b284b6boscar/global_step80108/layer_04-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..102a6a757bb9af65ea54505e6a45b92ad9329f5d --- /dev/null +++ b/4b284b6boscar/global_step80108/layer_04-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b48d8acd6f333c116df6a897ca60324322abf45d24729fa6cd75276411a1580 +size 113308931 diff --git a/4b284b6boscar/global_step80108/layer_04-model_01-model_states.pt b/4b284b6boscar/global_step80108/layer_04-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fce1451d38c98b9d848218a05f247df28e9eb54c --- /dev/null +++ b/4b284b6boscar/global_step80108/layer_04-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c98de794588bcf3a332cb5a141c4d9256b89fbc367126cb0c1bdeb3c290fbe44 +size 113308931 diff --git a/4b284b6boscar/global_step80108/layer_05-model_00-model_states.pt b/4b284b6boscar/global_step80108/layer_05-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7062599f4562343c00055758713818d881c0cdf3 --- /dev/null +++ b/4b284b6boscar/global_step80108/layer_05-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:191f75d2f4cf3750a1bbf603b08d452f400cf07054b579498a3ea131590f62dc +size 113308931 diff --git a/4b284b6boscar/global_step80108/layer_05-model_01-model_states.pt b/4b284b6boscar/global_step80108/layer_05-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f6c6ffc5df1bec3d2e4e470e59e73fc17cd91ab8 --- /dev/null +++ b/4b284b6boscar/global_step80108/layer_05-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a6baff1ff74fa7d55d109aa69a51f2aaafde49b9b2766a9c516191bfeece6477 +size 113308931 diff --git a/4b284b6boscar/global_step80108/layer_06-model_00-model_states.pt b/4b284b6boscar/global_step80108/layer_06-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ae3010ee7cf7dd0e85acc9d6fab8b14ec8fe5aef --- /dev/null +++ b/4b284b6boscar/global_step80108/layer_06-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73c841ea8884b97abd7534bbc2fc31d3c9443b14018387e25748bde8de99fdda +size 113308931 diff --git a/4b284b6boscar/global_step80108/layer_06-model_01-model_states.pt b/4b284b6boscar/global_step80108/layer_06-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d5b3995b258f2d593a760a4d222955b28085c184 --- /dev/null +++ b/4b284b6boscar/global_step80108/layer_06-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:324b78d34cc7311edc9ed5a59944be4df84554e85b8e104718219afbb51f54d9 +size 113308931 diff --git a/4b284b6boscar/global_step80108/layer_07-model_00-model_states.pt b/4b284b6boscar/global_step80108/layer_07-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9f52ab9c4d38be212402375d8b66e3f58475cf18 --- /dev/null +++ b/4b284b6boscar/global_step80108/layer_07-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a0a6bec3644632b86d48648491b428db97147d492a376a5d9ac0de2a521958ad +size 113308931 diff --git a/4b284b6boscar/global_step80108/layer_07-model_01-model_states.pt b/4b284b6boscar/global_step80108/layer_07-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3b6d4fa88e3baae062422f184b3be675df836eba --- /dev/null +++ b/4b284b6boscar/global_step80108/layer_07-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4de6b5d29ac71b07afe096dc50413dea8fcb9edeb76cd7d69078b3ac5c9265cf +size 113308931 diff --git a/4b284b6boscar/global_step80108/layer_08-model_00-model_states.pt b/4b284b6boscar/global_step80108/layer_08-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9ee2b55e501c85b4762154c958de24b40b630035 --- /dev/null +++ b/4b284b6boscar/global_step80108/layer_08-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:81fca2e2bcc135253f4a7ab75b7a733d55eb9def734951af205a6b8a0bee73c9 +size 113308931 diff --git a/4b284b6boscar/global_step80108/layer_08-model_01-model_states.pt b/4b284b6boscar/global_step80108/layer_08-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..85f10ae9f05e6499f750f3e981fe9b2be38d2af4 --- /dev/null +++ b/4b284b6boscar/global_step80108/layer_08-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d7960432f86c8dad526bf5438103ff9d7627455b0634a486cf56edb6c6fe007 +size 113308931 diff --git a/4b284b6boscar/global_step80108/layer_09-model_00-model_states.pt b/4b284b6boscar/global_step80108/layer_09-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2c8f7ff910f09b06312aa1bc6f0ae7ee49ebe4ab --- /dev/null +++ b/4b284b6boscar/global_step80108/layer_09-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ec5448cd5c42b98cf13822347eb6ec60633f10100389e51a022b86a58ad9d5d +size 113308931 diff --git a/4b284b6boscar/global_step80108/layer_09-model_01-model_states.pt b/4b284b6boscar/global_step80108/layer_09-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..779d5ee22182c1c52f57bb7f9c51744ed37bd2b5 --- /dev/null +++ b/4b284b6boscar/global_step80108/layer_09-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef068f1bd96d14b95c6d1bd290d8742fe84aa4cb68f69bed12abc0deada0ca70 +size 113308931 diff --git a/4b284b6boscar/global_step80108/layer_10-model_00-model_states.pt b/4b284b6boscar/global_step80108/layer_10-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..44d24785994e3389fd189061a8cb263485dbca1d --- /dev/null +++ b/4b284b6boscar/global_step80108/layer_10-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b57d553b4022f3a3a00410828a50b2283b68e7d34016a61da2672db2de48696 +size 113308931 diff --git a/4b284b6boscar/global_step80108/layer_10-model_01-model_states.pt b/4b284b6boscar/global_step80108/layer_10-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9bff191aa58980040d72c61c28f21f1fab9d5ecd --- /dev/null +++ b/4b284b6boscar/global_step80108/layer_10-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f6852d7e1615cb20b13daab52b0266d7fd80614d870800727f3a515c6f1048e5 +size 113308931 diff --git a/4b284b6boscar/global_step80108/layer_11-model_00-model_states.pt b/4b284b6boscar/global_step80108/layer_11-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9270563c74ba57635e279b42b569c3570d2ffffb --- /dev/null +++ b/4b284b6boscar/global_step80108/layer_11-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39323ac0c50c1cd0aa655a582ecc89c3b52a9a7f1f32df84fbc9fa976d78798a +size 113308931 diff --git a/4b284b6boscar/global_step80108/layer_11-model_01-model_states.pt b/4b284b6boscar/global_step80108/layer_11-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f6e4f2af534ef65690df1620e8c91323a5ff4863 --- /dev/null +++ b/4b284b6boscar/global_step80108/layer_11-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b32b7f96b5103ae4ece5a7b46847d40ede6b023799f8d8478ebb7d8b448d83f +size 113308931 diff --git a/4b284b6boscar/global_step80108/layer_12-model_00-model_states.pt b/4b284b6boscar/global_step80108/layer_12-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7dd78f32157b07de2faad7fb3ba67f6ebb0da4d1 --- /dev/null +++ b/4b284b6boscar/global_step80108/layer_12-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4971054dcbd6e91fbb1a54b35b5bf1ff3bb6cb84d426fdcbecc706eb4bfade08 +size 113308931 diff --git a/4b284b6boscar/global_step80108/layer_12-model_01-model_states.pt b/4b284b6boscar/global_step80108/layer_12-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5c32ad259d4b6720f060c41ed486b809bdf77476 --- /dev/null +++ b/4b284b6boscar/global_step80108/layer_12-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:999a07e2e7829fd968dd875ea829cd1dac2bbdbeff3d26620484829aa856ef13 +size 113308931 diff --git a/4b284b6boscar/global_step80108/layer_13-model_00-model_states.pt b/4b284b6boscar/global_step80108/layer_13-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..09160143a4a97c23a0bc73a6942a306b09afc754 --- /dev/null +++ b/4b284b6boscar/global_step80108/layer_13-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:99685566f5485fe08350b6dec7b5e7a49b629a29d756c29d703672351be2f80f +size 113308931 diff --git a/4b284b6boscar/global_step80108/layer_13-model_01-model_states.pt b/4b284b6boscar/global_step80108/layer_13-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..aa51a2d617ee837be120ac8b74bb7be3a6c7efec --- /dev/null +++ b/4b284b6boscar/global_step80108/layer_13-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a007c8d947a48f4d0a1b0fe6428abfac4201699df8510581f957319d40eb6f55 +size 113308931 diff --git a/4b284b6boscar/global_step80108/layer_14-model_00-model_states.pt b/4b284b6boscar/global_step80108/layer_14-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..76d74f48cef092aae764b0a8b4c49f4a642a79df --- /dev/null +++ b/4b284b6boscar/global_step80108/layer_14-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:50920aa45c4a6eb771f0171097a171dfaa7e34f75c1c9ffe91672ee15137a02d +size 113308931 diff --git a/4b284b6boscar/global_step80108/layer_14-model_01-model_states.pt b/4b284b6boscar/global_step80108/layer_14-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9641f19582148168301fcbc77c1a4c81da1bbfd3 --- /dev/null +++ b/4b284b6boscar/global_step80108/layer_14-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:533528e5256ea5cdf26cfbbbd0b7fcec38676d3a75af250f57f30fae8e391d09 +size 113308931 diff --git a/4b284b6boscar/global_step80108/layer_15-model_00-model_states.pt b/4b284b6boscar/global_step80108/layer_15-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2c441001ae5d5f7a97aec1330c6023298a5d5f86 --- /dev/null +++ b/4b284b6boscar/global_step80108/layer_15-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:844670c410cebb32841d80717f8fe522f21a11f76547f98bb7e817e03ef7d60a +size 113308931 diff --git a/4b284b6boscar/global_step80108/layer_15-model_01-model_states.pt b/4b284b6boscar/global_step80108/layer_15-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..68ec3725cc2355388e5afc9e36c29e92b2f38d9f --- /dev/null +++ b/4b284b6boscar/global_step80108/layer_15-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:96a07d765d52d9bb56cfcdfed0e4751007b21984a691c470b0c8ba6351d6251f +size 113308931 diff --git a/4b284b6boscar/global_step80108/layer_16-model_00-model_states.pt b/4b284b6boscar/global_step80108/layer_16-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..139feda5ce01b049616dbdbf2b3a05a0a824d382 --- /dev/null +++ b/4b284b6boscar/global_step80108/layer_16-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ab690d09ac33f1a2e38e5fb629a89d38cad09c2d08162c4f019c15313c2d297 +size 113308931 diff --git a/4b284b6boscar/global_step80108/layer_16-model_01-model_states.pt b/4b284b6boscar/global_step80108/layer_16-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7ad455cecb42c837f44333dd2339d04a4e121d7c --- /dev/null +++ b/4b284b6boscar/global_step80108/layer_16-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2986894eb055507fc74249cdafb3ae1bbb3fe65cf50a6d6b0836cbb71d5bfd53 +size 113308931 diff --git a/4b284b6boscar/global_step80108/layer_17-model_00-model_states.pt b/4b284b6boscar/global_step80108/layer_17-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e8f6f9dce64937463507539b2a54582e8ad98881 --- /dev/null +++ b/4b284b6boscar/global_step80108/layer_17-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:adad2ce5aa84626e142a9225e5bd04ad780ea7434f85f84bc57d1382f90eddb2 +size 113308931 diff --git a/4b284b6boscar/global_step80108/layer_17-model_01-model_states.pt b/4b284b6boscar/global_step80108/layer_17-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b785c995da8711e6bc933f6f4687037b1d5ff2fd --- /dev/null +++ b/4b284b6boscar/global_step80108/layer_17-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1778854976a3e0d9885da1ada096f963625633f50359c40def170c9193eb9518 +size 113308931 diff --git a/4b284b6boscar/global_step80108/layer_18-model_00-model_states.pt b/4b284b6boscar/global_step80108/layer_18-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..47e70c43c609462f15e93556dcaa487f8da23a82 --- /dev/null +++ b/4b284b6boscar/global_step80108/layer_18-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d2f274754fa98e47f96a9d53e17e818ca6e218b6c47ee0c45286ff7ab5bc993 +size 113308931 diff --git a/4b284b6boscar/global_step80108/layer_18-model_01-model_states.pt b/4b284b6boscar/global_step80108/layer_18-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..299aae34539799f2ce8caf54a4a96151b1340cbd --- /dev/null +++ b/4b284b6boscar/global_step80108/layer_18-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:61dd8abf23f6b368978d8d72b12714ef9e4756292c116115284add4210c37f02 +size 113308931 diff --git a/4b284b6boscar/global_step80108/layer_19-model_00-model_states.pt b/4b284b6boscar/global_step80108/layer_19-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8a1f622794cdd415131fcca5a9c5494e074da809 --- /dev/null +++ b/4b284b6boscar/global_step80108/layer_19-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4774f118678bd7f2341397821382008b37d5cd3d4a508e8fe4f7982280164687 +size 113308931 diff --git a/4b284b6boscar/global_step80108/layer_19-model_01-model_states.pt b/4b284b6boscar/global_step80108/layer_19-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0a0ef9ccfb3ae9e53daeef2908913a4f9850ece8 --- /dev/null +++ b/4b284b6boscar/global_step80108/layer_19-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:849d3767140761be17b1a8c126bf12a427df183b4efc897c6c94c28a079709d0 +size 113308931 diff --git a/4b284b6boscar/global_step80108/layer_20-model_00-model_states.pt b/4b284b6boscar/global_step80108/layer_20-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..67e9391815107859b4ac5478af7e99c70d4129d1 --- /dev/null +++ b/4b284b6boscar/global_step80108/layer_20-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b11c63452d5e98bc4a54876b7ab164b2e85489a89bc435e613195ed8ffc0046 +size 113308931 diff --git a/4b284b6boscar/global_step80108/layer_20-model_01-model_states.pt b/4b284b6boscar/global_step80108/layer_20-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f4f52b1598d127a9d379dc627a91b0de106b3f02 --- /dev/null +++ b/4b284b6boscar/global_step80108/layer_20-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c2209c2a98be45709a49c7b31fe36d18d842ac230d729e643f3a799bdddcc0a +size 113308931 diff --git a/4b284b6boscar/global_step80108/layer_21-model_00-model_states.pt b/4b284b6boscar/global_step80108/layer_21-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ea9365ba71cc38be790f8a1974b94c25376f986d --- /dev/null +++ b/4b284b6boscar/global_step80108/layer_21-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d7fbef4821fa0381284f9fb8e2b6f0c42206b7d3fbcb01c117f1adafba1bb12 +size 113308931 diff --git a/4b284b6boscar/global_step80108/layer_21-model_01-model_states.pt b/4b284b6boscar/global_step80108/layer_21-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0a81619e4929269691ee16fe15d4096426fff337 --- /dev/null +++ b/4b284b6boscar/global_step80108/layer_21-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:569d04cadbe1a349188a625d20aefc8ec46967db821ff03a2ff1508e1babf726 +size 113308931 diff --git a/4b284b6boscar/global_step80108/layer_22-model_00-model_states.pt b/4b284b6boscar/global_step80108/layer_22-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a5c027abea5317606399e86ee682a18ec3a510e8 --- /dev/null +++ b/4b284b6boscar/global_step80108/layer_22-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b03c968af4c0396c0d65b995b885d006047a4ded75590b559d4ac508588bac77 +size 113308931 diff --git a/4b284b6boscar/global_step80108/layer_22-model_01-model_states.pt b/4b284b6boscar/global_step80108/layer_22-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..08fb28a42e567233d69446f498c62d5514517531 --- /dev/null +++ b/4b284b6boscar/global_step80108/layer_22-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f9cf985661f9b0efbf0bd02d457526d70f7d33f2577cd0599a8f2c026416947c +size 113308931 diff --git a/4b284b6boscar/global_step80108/layer_23-model_00-model_states.pt b/4b284b6boscar/global_step80108/layer_23-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..71323905fb4d760be09176ae96c802609ad55b42 --- /dev/null +++ b/4b284b6boscar/global_step80108/layer_23-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a266da2b1f68657e75c164a025d61264e51e26dfdc1cc2721573d59a0048a13d +size 113308931 diff --git a/4b284b6boscar/global_step80108/layer_23-model_01-model_states.pt b/4b284b6boscar/global_step80108/layer_23-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b3af198be1a799e084dfc52ab2c5256630c6ed2d --- /dev/null +++ b/4b284b6boscar/global_step80108/layer_23-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe4cf7de9fcfdee02c925b97a4045526a8cd0ed22817de9f46e492e09768caa6 +size 113308931 diff --git a/4b284b6boscar/global_step80108/layer_24-model_00-model_states.pt b/4b284b6boscar/global_step80108/layer_24-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..53e78b7abf8f92c1f50cb9ebae0141e47c359ff7 --- /dev/null +++ b/4b284b6boscar/global_step80108/layer_24-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:126ba6a2b10944f13ca936aabf1eae64e574e9601a3961897ba5f3cfc053196a +size 113308931 diff --git a/4b284b6boscar/global_step80108/layer_24-model_01-model_states.pt b/4b284b6boscar/global_step80108/layer_24-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..62e4a452474b4e9d284820a96f7419174a81b570 --- /dev/null +++ b/4b284b6boscar/global_step80108/layer_24-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d325007ff8b8bfbd820342d9a0daf156b13e75fb448c44ce0cf84e19be7f484 +size 113308931 diff --git a/4b284b6boscar/global_step80108/layer_25-model_00-model_states.pt b/4b284b6boscar/global_step80108/layer_25-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0a6b133613fa4a3592ceed1ec410d4989b8ab5cd --- /dev/null +++ b/4b284b6boscar/global_step80108/layer_25-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:41f62dea3a01866030bf0282973cc4b7744c0d4802f72914e7cf88bc4f5efb8b +size 113308931 diff --git a/4b284b6boscar/global_step80108/layer_25-model_01-model_states.pt b/4b284b6boscar/global_step80108/layer_25-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4149dc342fd905fdbbacfe63fd1eb4a79dac389f --- /dev/null +++ b/4b284b6boscar/global_step80108/layer_25-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31c1d1cbed414c592267c948270ad9bbf51346858f4fab8626c973fef1f7f058 +size 113308931 diff --git a/4b284b6boscar/global_step80108/layer_26-model_00-model_states.pt b/4b284b6boscar/global_step80108/layer_26-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..29913562ed22634fa46d52c305bb3a60ca573a8f --- /dev/null +++ b/4b284b6boscar/global_step80108/layer_26-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d11dc1bbb1acd8deb6a8438d372cb7027aeb05e60e980f466879e3b1a95c8e47 +size 113308931 diff --git a/4b284b6boscar/global_step80108/layer_26-model_01-model_states.pt b/4b284b6boscar/global_step80108/layer_26-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..acf32acb5104b23f386842defd3a808e8adefaab --- /dev/null +++ b/4b284b6boscar/global_step80108/layer_26-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7549a145071e19c08bdd9ffa068eaa390b2a50ae9350473c0b6287f6b5f9208 +size 113308931 diff --git a/4b284b6boscar/global_step80108/layer_27-model_00-model_states.pt b/4b284b6boscar/global_step80108/layer_27-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..47c30bfe9ef459b0838882482f427e3318a4a545 --- /dev/null +++ b/4b284b6boscar/global_step80108/layer_27-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7174555c504c969d89b735728d28e226931931a075790030c721834f38387aed +size 113308931 diff --git a/4b284b6boscar/global_step80108/layer_27-model_01-model_states.pt b/4b284b6boscar/global_step80108/layer_27-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3dfe6e498b080a631c32d62315a734bcf0309092 --- /dev/null +++ b/4b284b6boscar/global_step80108/layer_27-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b4443d2ecc0594ecb4253ebb0a9b7fd019fa705d755100f07502b1a0669cde1c +size 113308931 diff --git a/4b284b6boscar/global_step80108/layer_28-model_00-model_states.pt b/4b284b6boscar/global_step80108/layer_28-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3adf8b09ab1c4baf46daa8bd1e1b13fb9a4c6123 --- /dev/null +++ b/4b284b6boscar/global_step80108/layer_28-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:16232aea58b2cd1d362139abb7277de44f4dfe47c0df106618135304bdfb7261 +size 113308931 diff --git a/4b284b6boscar/global_step80108/layer_28-model_01-model_states.pt b/4b284b6boscar/global_step80108/layer_28-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..42d64cc26deee59a97f7e32ce533be6aaf070f13 --- /dev/null +++ b/4b284b6boscar/global_step80108/layer_28-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:98b8747335623acd6f68bd4b61cc665ab378e7ada2900ec1c169318f3895f7b7 +size 113308931 diff --git a/4b284b6boscar/global_step80108/layer_29-model_00-model_states.pt b/4b284b6boscar/global_step80108/layer_29-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..29ed184976ffa8f7ef38bda24ea9f361da3f727d --- /dev/null +++ b/4b284b6boscar/global_step80108/layer_29-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cffe98719890c92c36ede790f1fb70bc261523a1728250d1e9d161743b41cac2 +size 113308931 diff --git a/4b284b6boscar/global_step80108/layer_29-model_01-model_states.pt b/4b284b6boscar/global_step80108/layer_29-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..310fe6829978f67efb8c675092a595981c92bc68 --- /dev/null +++ b/4b284b6boscar/global_step80108/layer_29-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:303ec356c04579c6e3a4f7c4833b25fa51c4b66ebafdf3191fc60914eaf3c7bd +size 113308931 diff --git a/4b284b6boscar/global_step80108/layer_30-model_00-model_states.pt b/4b284b6boscar/global_step80108/layer_30-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..442738f70ea76b5229bd115ac7ebd5a649cb7b9c --- /dev/null +++ b/4b284b6boscar/global_step80108/layer_30-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:719f44dfe43a9930e7b2fd732bc84eda59f2e83ebf25367a25720e02431e5d18 +size 113308931 diff --git a/4b284b6boscar/global_step80108/layer_30-model_01-model_states.pt b/4b284b6boscar/global_step80108/layer_30-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0dbf76831ea076879b2230f4d341920432ce1dac --- /dev/null +++ b/4b284b6boscar/global_step80108/layer_30-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e8ce7c26065ee60cc95305eba1be7e09b7db452e01d7c26b6cc6339c20febfd +size 113308931 diff --git a/4b284b6boscar/global_step80108/layer_31-model_00-model_states.pt b/4b284b6boscar/global_step80108/layer_31-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ca08899cb1cf34da1d6b56454efc76cbd0c4ad93 --- /dev/null +++ b/4b284b6boscar/global_step80108/layer_31-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6aaa5d1f80c758b4d783753de2c8dc18548a4f1cca01763f7d01ab43f2f91fc3 +size 113308931 diff --git a/4b284b6boscar/global_step80108/layer_31-model_01-model_states.pt b/4b284b6boscar/global_step80108/layer_31-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a1b8611d767f80415af3e5f23a871c23aeef3b8e --- /dev/null +++ b/4b284b6boscar/global_step80108/layer_31-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8dd2cc3adf3dc06c737fb45790f0a07a7cc9841514729c2870df8208e966383 +size 113308931 diff --git a/4b284b6boscar/global_step80108/layer_32-model_00-model_states.pt b/4b284b6boscar/global_step80108/layer_32-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e66a39aabdb186d736a7abd0ee0aa65dcb5bd627 --- /dev/null +++ b/4b284b6boscar/global_step80108/layer_32-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3c3a666039e6ab725d31008f2833c52071043f5dab7367e924ea03d511c7d67 +size 113308931 diff --git a/4b284b6boscar/global_step80108/layer_32-model_01-model_states.pt b/4b284b6boscar/global_step80108/layer_32-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b608e42701bef35b879eeedcfb150206fc569c7b --- /dev/null +++ b/4b284b6boscar/global_step80108/layer_32-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b097147ab160e741a6d1f790196d1f901c26130f36d9a42d02239871ef7140ba +size 113308931 diff --git a/4b284b6boscar/global_step80108/layer_33-model_00-model_states.pt b/4b284b6boscar/global_step80108/layer_33-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..67cf97dc050aef3e1e0bcf937dcf227856115ba3 --- /dev/null +++ b/4b284b6boscar/global_step80108/layer_33-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:004af62bfd94520b0eebb4cf307becee4674d1ac236c859d753a5c6c6ccc8710 +size 113308931 diff --git a/4b284b6boscar/global_step80108/layer_33-model_01-model_states.pt b/4b284b6boscar/global_step80108/layer_33-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bd8564747c247f823b555c36d6ac7e009438f441 --- /dev/null +++ b/4b284b6boscar/global_step80108/layer_33-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b17dfec7dc1ffff7e08b23f63191226c3792119747ccc5d5b45fbf357d138c6 +size 113308931 diff --git a/4b284b6boscar/global_step80108/layer_34-model_00-model_states.pt b/4b284b6boscar/global_step80108/layer_34-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b71d0b1c094799bb7cd4859609c1990d7938f767 --- /dev/null +++ b/4b284b6boscar/global_step80108/layer_34-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c6ff235a79a4c5c9dea3f529ba5e580f7d58b28d5646455f2d3ed940230282d +size 113308931 diff --git a/4b284b6boscar/global_step80108/layer_34-model_01-model_states.pt b/4b284b6boscar/global_step80108/layer_34-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..82866b5aabf1ddb657967ffb258b5570903f37ef --- /dev/null +++ b/4b284b6boscar/global_step80108/layer_34-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:051fb252d9fe84ca1eedd6f9e0b8ee28e54cda739ef0cb6975526f49a0e43694 +size 113308931 diff --git a/4b284b6boscar/global_step80108/layer_35-model_00-model_states.pt b/4b284b6boscar/global_step80108/layer_35-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..efb030d6169e6da220d561d9c6f56513241ee1e5 --- /dev/null +++ b/4b284b6boscar/global_step80108/layer_35-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:afcb97eabd3f4d4682d9b10a0104cfb356a1599ef86d2b8f0bc46e1e29ce90db +size 113308931 diff --git a/4b284b6boscar/global_step80108/layer_35-model_01-model_states.pt b/4b284b6boscar/global_step80108/layer_35-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8ef2ea56004b90cc74ed830dc830e33b89fb413b --- /dev/null +++ b/4b284b6boscar/global_step80108/layer_35-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c079858d2117eebdbbb5d53f42e8f8eeec6bb76740769aa4bc3cc998ed85707b +size 113308931 diff --git a/4b284b6boscar/global_step80108/layer_36-model_00-model_states.pt b/4b284b6boscar/global_step80108/layer_36-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a53c1b4bee1fa95c42296bd66eaf8338d1d0b149 --- /dev/null +++ b/4b284b6boscar/global_step80108/layer_36-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b4c02f611d712b325b995f2aba7607372f6acda91a2b306d75eaf5d8c5e6f11 +size 113308931 diff --git a/4b284b6boscar/global_step80108/layer_36-model_01-model_states.pt b/4b284b6boscar/global_step80108/layer_36-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cf362e9c919836e76278d78614a71aac7becea6a --- /dev/null +++ b/4b284b6boscar/global_step80108/layer_36-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9dea6f2ce0ad64a46d07b99943fec6db45db5f4a67622982d9eaf679cf870d0 +size 113308931 diff --git a/4b284b6boscar/global_step80108/layer_37-model_00-model_states.pt b/4b284b6boscar/global_step80108/layer_37-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..177e8218285e591e1666463044b64c73020293e0 --- /dev/null +++ b/4b284b6boscar/global_step80108/layer_37-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f185e9018d7b8d3745d7b670582399f4719a6af2e1e56409bd44128e2caf33ea +size 113308931 diff --git a/4b284b6boscar/global_step80108/layer_37-model_01-model_states.pt b/4b284b6boscar/global_step80108/layer_37-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6049cfdde3738ef1a1710cbe848d9184c0722bd5 --- /dev/null +++ b/4b284b6boscar/global_step80108/layer_37-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0d618b08d7ffa95a413df3cf9825c989625378f4a8b6f19b3d2a96e644d175e +size 113308931 diff --git a/4b284b6boscar/global_step80108/layer_38-model_00-model_states.pt b/4b284b6boscar/global_step80108/layer_38-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2a0e71a4ca9a619840002b81c5c98bff9c293113 --- /dev/null +++ b/4b284b6boscar/global_step80108/layer_38-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b3a838cb1f65bebca47aa5cb330464ce0f60d94ebfae23250ea1a554e02b90b5 +size 113308931 diff --git a/4b284b6boscar/global_step80108/layer_38-model_01-model_states.pt b/4b284b6boscar/global_step80108/layer_38-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cb17a3a0de0bb05513eaf698a178c7e56d460da9 --- /dev/null +++ b/4b284b6boscar/global_step80108/layer_38-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d78976ba3514ed93422ea2a3ff19f7615c7d2ebfe7cccde6fd9a7e4e9ecfffe0 +size 113308931 diff --git a/4b284b6boscar/global_step80108/layer_40-model_00-model_states.pt b/4b284b6boscar/global_step80108/layer_40-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fe788280c5bc4af6cf8f6f33aac73ddcbe9a71f5 --- /dev/null +++ b/4b284b6boscar/global_step80108/layer_40-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:15f4a964b6194fb52a20acf25dc14caeb643eede87a603e9579d1e0af1c47582 +size 13507 diff --git a/4b284b6boscar/global_step80108/layer_40-model_01-model_states.pt b/4b284b6boscar/global_step80108/layer_40-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cf30259fb8fb54d0f632c3d28632734f76054bfb --- /dev/null +++ b/4b284b6boscar/global_step80108/layer_40-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:16c9f9624fdd29c285e5893d8229141d1c89818bfdf13c6586f824c44b11124f +size 13507 diff --git a/4b284b6boscar/global_step80108/mp_rank_00_model_states.pt b/4b284b6boscar/global_step80108/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ceb0cbbb0008103d39959e09bb3fea7375f0adb7 --- /dev/null +++ b/4b284b6boscar/global_step80108/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:48f7c684a35f6ebaddcd8afcf5cb859afaa09318e719e79de9f049f5a7998c97 +size 51635 diff --git a/4b284b6boscar/global_step80108/mp_rank_01_model_states.pt b/4b284b6boscar/global_step80108/mp_rank_01_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f4074f86c6654a2cffcc2ac68f44925307827bf0 --- /dev/null +++ b/4b284b6boscar/global_step80108/mp_rank_01_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:458f6284521933969dca73733bbc674cfd8a8d931db9689739ed70ceb4e6eab5 +size 51635 diff --git a/4b284b6boscar/transformers/config.json b/4b284b6boscar/transformers/config.json new file mode 100644 index 0000000000000000000000000000000000000000..df814c3a71ee49044410636b5eeb4f43611690ba --- /dev/null +++ b/4b284b6boscar/transformers/config.json @@ -0,0 +1 @@ +{"vocab_size": 50432, "n_positions": 2048, "n_embd": 3072, "n_layer": 36, "n_head": 24, "n_inner": 12288, "activation_function": "gelu", "resid_pdrop": 0.1, "embd_pdrop": 0.1, "attn_pdrop": 0.1, "layer_norm_epsilon": 1e-05, "initializer_range": 0.02, "summary_type": "cls_index", "summary_use_proj": true, "summary_activation": null, "summary_first_dropout": 0.1, "summary_proj_to_labels": true, "scale_attn_weights": true, "use_cache": true, "scale_attn_by_inverse_layer_idx": false, "reorder_and_upcast_attn": false, "bos_token_id": 50256, "eos_token_id": 50256, "return_dict": true, "output_hidden_states": false, "output_attentions": false, "torchscript": false, "torch_dtype": null, "use_bfloat16": false, "tf_legacy_loss": false, "pruned_heads": {}, "tie_word_embeddings": true, "is_encoder_decoder": false, "is_decoder": false, "cross_attention_hidden_size": null, "add_cross_attention": false, "tie_encoder_decoder": false, "max_length": 20, "min_length": 0, "do_sample": false, "early_stopping": false, "num_beams": 1, "num_beam_groups": 1, "diversity_penalty": 0.0, "temperature": 1.0, "top_k": 50, "top_p": 1.0, "typical_p": 1.0, "repetition_penalty": 1.0, "length_penalty": 1.0, "no_repeat_ngram_size": 0, "encoder_no_repeat_ngram_size": 0, "bad_words_ids": null, "num_return_sequences": 1, "chunk_size_feed_forward": 0, "output_scores": false, "return_dict_in_generate": false, "forced_bos_token_id": null, "forced_eos_token_id": null, "remove_invalid_values": false, "exponential_decay_length_penalty": null, "suppress_tokens": null, "begin_suppress_tokens": null, "architectures": ["GPT2LMHeadModel"], "finetuning_task": null, "id2label": {"0": "LABEL_0", "1": "LABEL_1"}, "label2id": {"LABEL_0": 0, "LABEL_1": 1}, "tokenizer_class": null, "prefix": null, "pad_token_id": null, "sep_token_id": null, "decoder_start_token_id": null, "task_specific_params": null, "problem_type": null, "_name_or_path": "", "transformers_version": "4.25.0.dev0", "n_ctx": 1024, "gradient_checkpointing": false, "model_type": "gpt2"} \ No newline at end of file diff --git a/4b284b6boscar/transformers/pytorch_model.bin b/4b284b6boscar/transformers/pytorch_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..e978995f237f5b96cc4c803670400fa0f854e7d4 --- /dev/null +++ b/4b284b6boscar/transformers/pytorch_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9955215d07b5547df3ee9ce09303843a407768aa2511753d3d4614f8dead1af7 +size 8781203669