diff --git a/4b284b28bc4seed1/evaluation/generation/agg.4b284b28bc4seed1_GEM-web_nlg_en_PALM_prompt_0.json b/4b284b28bc4seed1/evaluation/generation/agg.4b284b28bc4seed1_GEM-web_nlg_en_PALM_prompt_0.json new file mode 100644 index 0000000000000000000000000000000000000000..06c9c27f2822085839f65a14b1b1c5808be1104e --- /dev/null +++ b/4b284b28bc4seed1/evaluation/generation/agg.4b284b28bc4seed1_GEM-web_nlg_en_PALM_prompt_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.37735446471481876, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.03627756616654335}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.0770951414018354, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0016045271434282637}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.32071402180605507, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004605078296811788}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.11660803455743125, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002092415000785059}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.036415277664524216, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0009758440561531726}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.15772225366490272, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0032080616090033745}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.05551128171851163, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0013139706655432171}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.07386003315833899, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0014481551839227544}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.3123826157382853, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0045001843968478835}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.11225387153032584, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0019226335441299288}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.07376812234473101, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0014993347968782623}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.3075886721444383, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004330300847827791}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.11169551049560707, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0019597969064310676}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b28bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b28bc4seed1/evaluation/generation/agg.4b284b28bc4seed1_GEM-web_nlg_en_PALM_prompt_1.json b/4b284b28bc4seed1/evaluation/generation/agg.4b284b28bc4seed1_GEM-web_nlg_en_PALM_prompt_1.json new file mode 100644 index 0000000000000000000000000000000000000000..4ebe8a01f32c2434678bb9d50a8d3e15d2d47bf2 --- /dev/null +++ b/4b284b28bc4seed1/evaluation/generation/agg.4b284b28bc4seed1_GEM-web_nlg_en_PALM_prompt_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.5955492347128004, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.04098243772631065}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.08263899702993936, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.001483174937834192}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.4023666815632534, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.005245336574571597}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.12834095324411207, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0019248518716807731}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.039217284731154656, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0009170392495425271}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.20543752587672504, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.003913508994823848}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.061270467324873235, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0012492449538634826}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.07806911458526311, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.001322862559894183}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.3835240834246368, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004954856771984596}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.12158319023743391, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0017288009789448422}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.07810015746385479, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0013877161994542311}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.38024068911899445, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004835861426173133}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.12124370085382484, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0017887287009066164}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b28bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b28bc4seed1/evaluation/generation/agg.4b284b28bc4seed1_GEM-web_nlg_en_PALM_prompt_2.json b/4b284b28bc4seed1/evaluation/generation/agg.4b284b28bc4seed1_GEM-web_nlg_en_PALM_prompt_2.json new file mode 100644 index 0000000000000000000000000000000000000000..2f7711cb4d01f14973f0adf2e6f5595058357fe4 --- /dev/null +++ b/4b284b28bc4seed1/evaluation/generation/agg.4b284b28bc4seed1_GEM-web_nlg_en_PALM_prompt_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.6719567149622531, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.04451490063633614}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.08290888658614914, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0015350215758182237}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.4194244346322516, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.005283499761780351}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.12936180136586783, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.001954303430193513}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.03927899079960598, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0009493902598473397}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.214648184705714, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.004017055136123084}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.06151955178238632, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0012577473248259622}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.07707538779187502, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0013161012683531753}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.3915395709801734, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0048204418807369295}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.12064349526703928, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.001720033258665151}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.07820442311124796, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0013841071483193569}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.3953219549146526, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004864683263901412}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.12216673770750221, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.001800956219634565}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b28bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b28bc4seed1/evaluation/generation/agg.4b284b28bc4seed1_GEM-web_nlg_en_PALM_prompt_3.json b/4b284b28bc4seed1/evaluation/generation/agg.4b284b28bc4seed1_GEM-web_nlg_en_PALM_prompt_3.json new file mode 100644 index 0000000000000000000000000000000000000000..2b82c69cebae9066847300761cd210701005a040 --- /dev/null +++ b/4b284b28bc4seed1/evaluation/generation/agg.4b284b28bc4seed1_GEM-web_nlg_en_PALM_prompt_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.7030429320938599, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.04228909607379892}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.07917967419538707, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0014240165968682841}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.42024267058618486, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.005232177743876596}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.12494961329088779, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.001871934588598472}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.03673571584796494, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0008485900852921835}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.21159361761560835, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.003896974137970697}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.05835931677377586, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.001172617966432863}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.07289709850715816, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.001220535361848458}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.3865171662156251, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004668856621947524}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.11519873729255874, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0016320470107472416}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.07468731684101934, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0013010266610264402}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.3950249369083203, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0047835320890464855}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.11782366546024012, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0017256698791084089}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b28bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b28bc4seed1/evaluation/generation/agg.4b284b28bc4seed1_GEM-web_nlg_en_PALM_prompt_4.json b/4b284b28bc4seed1/evaluation/generation/agg.4b284b28bc4seed1_GEM-web_nlg_en_PALM_prompt_4.json new file mode 100644 index 0000000000000000000000000000000000000000..0f41773b87c2be0b8fb7ed3641f65e7f90b17542 --- /dev/null +++ b/4b284b28bc4seed1/evaluation/generation/agg.4b284b28bc4seed1_GEM-web_nlg_en_PALM_prompt_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.7009084921005813, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.05429101270641276}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.0787656137813602, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0014303284095470072}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.4198316942830002, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0051407465648353945}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.12409393489139078, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.001785975484122767}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.03711436336217505, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0009399506148593571}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.21491818852062866, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.003973307675575708}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.05863215249774496, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0011389709231231604}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.07260277037447828, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0012668906951770727}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.38573795956761925, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004591295339002268}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.11439156159112489, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0015688033893795825}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.0744525796262277, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0013359002532122982}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.3952770689440709, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004713626458568202}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.11724728813607507, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.001670529322751021}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b28bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b28bc4seed1/evaluation/generation/agg.4b284b28bc4seed1_GEM-web_nlg_en_PALM_prompt_5.json b/4b284b28bc4seed1/evaluation/generation/agg.4b284b28bc4seed1_GEM-web_nlg_en_PALM_prompt_5.json new file mode 100644 index 0000000000000000000000000000000000000000..3c7f04f93b1edbc8d00925537de9f53f8d559c4b --- /dev/null +++ b/4b284b28bc4seed1/evaluation/generation/agg.4b284b28bc4seed1_GEM-web_nlg_en_PALM_prompt_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.7813605370790605, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.044236747351497484}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.07910701465761572, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0014814464979107673}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.42965787368823066, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.005259601751094787}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.12489900535257513, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.001892834896809631}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.03705119454588921, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0009271466855999936}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.2180047518637017, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.00400770350410333}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.058674755789965206, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0012025616483889573}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.07219818322662526, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0012976343736866773}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.3913465741327545, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004618454191060434}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.11391088630556961, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0016293445333007116}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.07484317706922312, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0014014602911312686}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.4051096507534578, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004862305392822499}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.11797028786316605, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0017753435966714796}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b28bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b28bc4seed1/evaluation/generation/agg.4b284b28bc4seed1_GEM-wiki_lingua_en_tldr_en_0.json b/4b284b28bc4seed1/evaluation/generation/agg.4b284b28bc4seed1_GEM-wiki_lingua_en_tldr_en_0.json new file mode 100644 index 0000000000000000000000000000000000000000..bf8f55322e2e5e4f316829ba6134488516436f80 --- /dev/null +++ b/4b284b28bc4seed1/evaluation/generation/agg.4b284b28bc4seed1_GEM-wiki_lingua_en_tldr_en_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.1472006912589573, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0018081532683583343}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.25280412679250724, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0027283406577109795}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.17278267579995407, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.001805309989869822}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.02800882087488719, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0007031555613566064}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.05161999521321001, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0014471575437312986}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.033403065447518296, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0008091708062643894}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.1151686636057282, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0012754431121468031}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.20439066404636233, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002231774421791313}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.13668346985187405, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0013073897309746026}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.1342468034278481, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0016375746774704983}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.2313321529160814, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002494421485097423}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.15765023763708086, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.001625669978151679}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 1.4207573221891459, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.060668680742149504}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b28bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b28bc4seed1/evaluation/generation/agg.4b284b28bc4seed1_GEM-wiki_lingua_en_tldr_en_1.json b/4b284b28bc4seed1/evaluation/generation/agg.4b284b28bc4seed1_GEM-wiki_lingua_en_tldr_en_1.json new file mode 100644 index 0000000000000000000000000000000000000000..1804b6ce44c554e6b29dd5014821bbe633976aba --- /dev/null +++ b/4b284b28bc4seed1/evaluation/generation/agg.4b284b28bc4seed1_GEM-wiki_lingua_en_tldr_en_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.19794818451477075, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.002216007848664949}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.3284489945851762, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002997251491577378}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.22635289032885908, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0019797732821072913}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.05003816092030399, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0010440179296527974}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.0863451197200493, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0018333871572600053}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.057255731342826154, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0010651766443270621}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.1385898377468809, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0015132970995651801}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.23662979084247882, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002337708767980629}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.1592439241741607, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0013041393201605942}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.18480829497363066, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0020842494081539653}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.30748871703201347, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0028452982805044153}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.21134027415429807, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0018497593685481146}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 2.863520294428325, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.04821407211996815}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b28bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b28bc4seed1/evaluation/generation/agg.4b284b28bc4seed1_GEM-wiki_lingua_en_tldr_en_2.json b/4b284b28bc4seed1/evaluation/generation/agg.4b284b28bc4seed1_GEM-wiki_lingua_en_tldr_en_2.json new file mode 100644 index 0000000000000000000000000000000000000000..35dce510d1bac972c391719d494349b13666afb3 --- /dev/null +++ b/4b284b28bc4seed1/evaluation/generation/agg.4b284b28bc4seed1_GEM-wiki_lingua_en_tldr_en_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.19406216075430627, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0022851568065445846}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.30801257358803485, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002815672688199465}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.21621899679871145, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0018861785936639156}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.04969349334752031, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0012211667072253483}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.07912027885387732, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.001712170031568902}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.054139172220906376, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0010468476711488718}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.1390654173595737, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0016872675834548336}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.22587848754502876, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002267886826339719}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.15514555559600926, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0013211824425543813}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.18238320998068505, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0021483718861069925}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.2906352040127194, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0026915444202120025}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.2033687466390169, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0017670650217538845}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 2.892049675027145, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.05098830000976219}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b28bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b28bc4seed1/evaluation/generation/agg.4b284b28bc4seed1_GEM-wiki_lingua_en_tldr_en_3.json b/4b284b28bc4seed1/evaluation/generation/agg.4b284b28bc4seed1_GEM-wiki_lingua_en_tldr_en_3.json new file mode 100644 index 0000000000000000000000000000000000000000..d8de04fed6cf43e7b73fc92cf503fe376590b54d --- /dev/null +++ b/4b284b28bc4seed1/evaluation/generation/agg.4b284b28bc4seed1_GEM-wiki_lingua_en_tldr_en_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.17111604893495974, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.002666234365501737}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.25241562149299535, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0032749227911704902}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.18012746746417807, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002211658008220921}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.04327701615115013, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.001228777572136881}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.06549662087884625, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0016995103815543647}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.04512193425646708, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0010254911232422685}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.12471745040277263, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0020684991761244493}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.18654805673867839, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002583812297767984}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.13030697479391384, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0015820227940213536}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.16128332553163546, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0025338005143025694}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.23839128203771087, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.003113680952409177}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.1697095188842209, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0020776929681688918}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 2.9015609655711327, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.0731100382224477}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b28bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b28bc4seed1/evaluation/generation/agg.4b284b28bc4seed1_GEM-wiki_lingua_en_tldr_en_4.json b/4b284b28bc4seed1/evaluation/generation/agg.4b284b28bc4seed1_GEM-wiki_lingua_en_tldr_en_4.json new file mode 100644 index 0000000000000000000000000000000000000000..293ea444201cf8f952ea07f1c340e7e607d5bcc6 --- /dev/null +++ b/4b284b28bc4seed1/evaluation/generation/agg.4b284b28bc4seed1_GEM-wiki_lingua_en_tldr_en_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.054570512553222275, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0021295344255454545}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.0795788085275046, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002819526024958868}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.0547919221475693, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0018695427841614045}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.012963816979253771, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0008570339066074451}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.020089181351346234, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0011359068136854778}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.012956061411719485, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.000654310189300764}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.04143340245616873, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.001670845773969632}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.060916796276303795, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0022168298240763207}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.041080312014145574, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.001390509184087734}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.05115883129564417, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0020129461932352306}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.07453932183957888, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0026507114407709974}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.05125820536012792, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0017489799459199928}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 0.5498632715838676, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.04532412143006689}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b28bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b28bc4seed1/evaluation/generation/agg.4b284b28bc4seed1_GEM-wiki_lingua_en_tldr_en_5.json b/4b284b28bc4seed1/evaluation/generation/agg.4b284b28bc4seed1_GEM-wiki_lingua_en_tldr_en_5.json new file mode 100644 index 0000000000000000000000000000000000000000..c982ed3220af93deedc6eb471ae1ab8b5f23fb7b --- /dev/null +++ b/4b284b28bc4seed1/evaluation/generation/agg.4b284b28bc4seed1_GEM-wiki_lingua_en_tldr_en_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.009254019379187583, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0009687953589273818}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.012906851032002356, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0012462005287005372}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.009074928433158342, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0008689330426263544}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.0024187488668729984, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.00044284833188613796}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.0031816545395102693, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0004382892858640001}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.0022561594203614308, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.00031382246712575974}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.0070282827330193105, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0007783399245473895}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.009802719504705336, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0009814452084083668}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.006803875534069048, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0006705094104727261}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.008596891531763053, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0009017346586956089}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.012142210310286464, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0011816152654071754}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.00846353027326687, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0008128006829974675}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 7.095551523492589e-07, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 1.483647929837512e-06}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b28bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b28bc4seed1/evaluation/generation/agg.4b284b28bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_0.json b/4b284b28bc4seed1/evaluation/generation/agg.4b284b28bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_0.json new file mode 100644 index 0000000000000000000000000000000000000000..eeac7eee2222c1de9da00b6e296b6d93eb5ed5c0 --- /dev/null +++ b/4b284b28bc4seed1/evaluation/generation/agg.4b284b28bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 0.4098344694476387, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.05659734906094685}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.08028081330149647, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0015384112652978448}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.04939996548808655, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0013089989862407679}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.048385938607711065, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0009554921914241868}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.0027541218407848736, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.00035092238584102253}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.0033678792789505574, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.00032239765676952145}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.0024384647317544604, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.00023457941137137737}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.07933411355241447, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0015031308017294464}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.04857484893118309, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0012730023314328899}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.0477602327181495, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0009369815165680327}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.07839335233527917, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0014996927491176875}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.04630917456025576, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0011796155371411761}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.046214076424090866, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0008828068716652509}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b28bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b28bc4seed1/evaluation/generation/agg.4b284b28bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_1.json b/4b284b28bc4seed1/evaluation/generation/agg.4b284b28bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_1.json new file mode 100644 index 0000000000000000000000000000000000000000..9631f8a7db3db9702a1543d517e7d2e34f652508 --- /dev/null +++ b/4b284b28bc4seed1/evaluation/generation/agg.4b284b28bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 11.566579816189526, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.1008934461871328}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.5476584258558421, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.003456480736532219}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.41369520299915363, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0030436852499156355}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.44235732853210524, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0023941703294020514}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.26480819367826736, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.002815017462568761}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.1947916755785088, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0021369452000412747}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.2090655371625227, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0019982452977907856}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.40566221817688664, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.003117710931571736}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.30207439523525703, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0024361075306840673}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.3244139780407101, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0020695436330019803}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.4515596659057806, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.00330045757816753}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.3391748876129398, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002736309734827984}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.3633576021387155, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0022990935361642674}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b28bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b28bc4seed1/evaluation/generation/agg.4b284b28bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_2.json b/4b284b28bc4seed1/evaluation/generation/agg.4b284b28bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_2.json new file mode 100644 index 0000000000000000000000000000000000000000..f59469d78e5899a8f1abe0af871b8cea652911c8 --- /dev/null +++ b/4b284b28bc4seed1/evaluation/generation/agg.4b284b28bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 13.388773838263758, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.15855873725678352}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.5789198401113218, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0034646581707259965}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.43386579914021006, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0028978275527303445}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.4668734222692764, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002246846357740528}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.29695825419975175, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.003050205383079884}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.21537221020252503, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002178321767423481}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.23283198535704958, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0020561178954031285}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.4435501207130385, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0033174896772021436}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.3283330300619082, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0024660245741253578}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.35447078432499324, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0021030174285698792}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.490510155822524, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.003436994721582442}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.3662609564143789, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0027327897367931055}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.39454340194994386, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0023023116088308807}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b28bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b28bc4seed1/evaluation/generation/agg.4b284b28bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_3.json b/4b284b28bc4seed1/evaluation/generation/agg.4b284b28bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_3.json new file mode 100644 index 0000000000000000000000000000000000000000..544b3811fc45cdf7fabc51ce82f6b10611a3dba2 --- /dev/null +++ b/4b284b28bc4seed1/evaluation/generation/agg.4b284b28bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 14.332946272100804, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.18137970117023247}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.5793041287934014, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.003372992411703443}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.4438630375906513, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0029246450295944823}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.47410403700383463, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0022235093842193814}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.30259452883798293, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.002973225867205113}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.2262470005601965, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002281252913319087}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.24214353888062579, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0020914337667352996}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.4446517195178283, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0032644622543037123}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.33699099215579725, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0025380393382758446}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.3610728360004429, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0021477160139884146}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.49295247754853494, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.003364958172666197}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.376746301427234, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0027787439904039756}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.4027299671398636, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002308027196519871}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b28bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b28bc4seed1/evaluation/generation/agg.4b284b28bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_4.json b/4b284b28bc4seed1/evaluation/generation/agg.4b284b28bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_4.json new file mode 100644 index 0000000000000000000000000000000000000000..4ddcc1335debc81fdcd5fde61c24c29996226104 --- /dev/null +++ b/4b284b28bc4seed1/evaluation/generation/agg.4b284b28bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 14.060665357528471, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.26445377512594503}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.5812217022092131, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0034309298270467957}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.43567025831059786, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002843591723717016}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.4710196471035029, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.00223956317877308}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.3024182514661336, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.003059613249842079}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.22039519212546937, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0022450567626817208}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.2391776138295886, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.002129468559557926}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.44652148397509384, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.003277961495936333}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.33135080522129373, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0024514490127927014}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.3592882674955681, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.002128255611143205}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.4943861067221433, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.003406003991655421}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.3698962329844, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002720553601988623}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.4001617252953104, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0023226135429815936}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b28bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b28bc4seed1/evaluation/generation/agg.4b284b28bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_5.json b/4b284b28bc4seed1/evaluation/generation/agg.4b284b28bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_5.json new file mode 100644 index 0000000000000000000000000000000000000000..b2e9f4a031a50940eb75a330d1ea0558b8393abb --- /dev/null +++ b/4b284b28bc4seed1/evaluation/generation/agg.4b284b28bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 14.308593309054016, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.14306952311664156}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.5775681396669916, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.003331795685464776}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.4402215693743334, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0027531550513425758}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.47488846126671874, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0021786011409350068}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.29979953949402255, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0029503967662262848}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.2224041099843757, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0021904880519093752}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.24094008936533884, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0020801259022813117}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.44250221759721664, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0031886562916719433}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.33425438519938394, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002422039927744084}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.36154908902057886, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0021160968101490625}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.49255025128439295, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.003325987333005444}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.3748555131665994, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002667744873458217}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.40460308229003333, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002297073510569085}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b28bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b28bc4seed1/evaluation/generation/agg.4b284b28bc4seed1_gem_xsum_article_DOC_summary_0.json b/4b284b28bc4seed1/evaluation/generation/agg.4b284b28bc4seed1_gem_xsum_article_DOC_summary_0.json new file mode 100644 index 0000000000000000000000000000000000000000..6786671251c1a3829569b81a11ebce95e9a853ef --- /dev/null +++ b/4b284b28bc4seed1/evaluation/generation/agg.4b284b28bc4seed1_gem_xsum_article_DOC_summary_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.1613424323587368, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.002278376950302783}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.3330533490420518, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004383443983456259}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.2087853046997779, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0025328837093340183}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.03314422437427033, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0012522698778844542}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.07302060035369815, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0026623802488437657}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.043870150801107066, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0015541821908238338}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.12067382175182433, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0017342073690786556}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.25037736095962637, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0034248848896776688}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.1562890353716468, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0019283406025933057}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.12496312472870656, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.001832956489326573}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.2617586907885203, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0038506762926574915}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.16248318414135096, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0021310634283090322}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 1.9479708786806795, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.08014965365678729}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b28bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b28bc4seed1/evaluation/generation/agg.4b284b28bc4seed1_gem_xsum_article_DOC_summary_1.json b/4b284b28bc4seed1/evaluation/generation/agg.4b284b28bc4seed1_gem_xsum_article_DOC_summary_1.json new file mode 100644 index 0000000000000000000000000000000000000000..fb21b49b7ec3e706c75fa449160a8d7e677e5d8a --- /dev/null +++ b/4b284b28bc4seed1/evaluation/generation/agg.4b284b28bc4seed1_gem_xsum_article_DOC_summary_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.13272782271590566, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0018764384818534341}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.3267515350090506, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004353020039146078}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.1865319266668177, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002524634111297582}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.0286660681091914, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.001013349141668393}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.07362289198488865, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002707772359921043}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.04075132217381377, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0014397841016716487}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.10272547144552927, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0013800002526758255}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.25572197637104055, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.003442070323824128}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.14475331879083578, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0018814005333497661}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.10462377645973141, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0015282810270458372}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.260731647450524, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0038051114474756866}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.14751402177418876, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0020984330928484275}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 1.6036382509204854, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.07096687163435135}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b28bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b28bc4seed1/evaluation/generation/agg.4b284b28bc4seed1_gem_xsum_article_DOC_summary_2.json b/4b284b28bc4seed1/evaluation/generation/agg.4b284b28bc4seed1_gem_xsum_article_DOC_summary_2.json new file mode 100644 index 0000000000000000000000000000000000000000..b752dc333e0198b88ef45172c70049a1b9592fcf --- /dev/null +++ b/4b284b28bc4seed1/evaluation/generation/agg.4b284b28bc4seed1_gem_xsum_article_DOC_summary_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.13076052871501112, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0018792476759405042}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.3221325006706253, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004397231507997294}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.18378435325514345, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002535460776839407}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.02746291848253061, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0010036620622712227}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.07033120823579617, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002679121665145769}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.038998510414389495, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0014233539161123735}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.10140981704363383, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0013659104358610527}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.2519770493702287, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.003389522634128558}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.14281263909344286, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0018586972576843518}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.10292716745077025, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.001493393265112054}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.2564707137279286, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0037227133454889715}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.14511393337009704, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0020497175410351316}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 1.5160558945216587, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.08240737955012244}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b28bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b28bc4seed1/evaluation/generation/agg.4b284b28bc4seed1_gem_xsum_article_DOC_summary_3.json b/4b284b28bc4seed1/evaluation/generation/agg.4b284b28bc4seed1_gem_xsum_article_DOC_summary_3.json new file mode 100644 index 0000000000000000000000000000000000000000..d4261354a9a364336500148068dfca2ad4fe615f --- /dev/null +++ b/4b284b28bc4seed1/evaluation/generation/agg.4b284b28bc4seed1_gem_xsum_article_DOC_summary_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.12752846466949222, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.002107108659509441}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.30226873054413106, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004603263404573647}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.1755472401383986, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0026658088779740008}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.02656552305156673, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0010143773775889025}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.06679540752654423, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0026398777724888113}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.03728687717351484, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0014073859223946697}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.09973634913453447, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0016065186547029968}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.2381694226551552, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.003581000725397854}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.1374413682741159, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0020025230497704035}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.10128532281127449, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0017234587079133783}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.242387646401674, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.003912550948546174}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.13972451850744902, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002189941237196646}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 1.4838319001573719, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.096950687868892}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b28bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b28bc4seed1/evaluation/generation/agg.4b284b28bc4seed1_gem_xsum_article_DOC_summary_4.json b/4b284b28bc4seed1/evaluation/generation/agg.4b284b28bc4seed1_gem_xsum_article_DOC_summary_4.json new file mode 100644 index 0000000000000000000000000000000000000000..ace834e7059edb8165a23174f709ad8e62b8b902 --- /dev/null +++ b/4b284b28bc4seed1/evaluation/generation/agg.4b284b28bc4seed1_gem_xsum_article_DOC_summary_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.04055839800057727, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.002477310590755891}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.075289351379979, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004369683499123559}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.04778183046984643, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0026876876154109395}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.007387682998651727, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0006990296012429621}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.01658715369278413, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0015969348183973628}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.009890919687627312, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0009266580590961874}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.03201249080708822, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0020286497636226534}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.058963105965077874, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0034421636677800026}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.037129528917459374, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.002067815641725132}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.032870357769899584, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0020908192203781383}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.060477341143397076, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0035760110748676577}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.03818253053785788, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0021629296440312594}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 0.7569692825353468, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.08589568488878548}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b28bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b28bc4seed1/evaluation/generation/agg.4b284b28bc4seed1_gem_xsum_article_DOC_summary_5.json b/4b284b28bc4seed1/evaluation/generation/agg.4b284b28bc4seed1_gem_xsum_article_DOC_summary_5.json new file mode 100644 index 0000000000000000000000000000000000000000..ffd1bc2d84192535dd868121ab5c1c674663928e --- /dev/null +++ b/4b284b28bc4seed1/evaluation/generation/agg.4b284b28bc4seed1_gem_xsum_article_DOC_summary_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.0027310061588494907, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0007639869380554712}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.002278390688529166, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.000653161458483614}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.002428042108949549, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0006836828342851362}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.0002712711508493972, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.00014357866607635477}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.00022836178496555851, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.00012848868152370965}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.0002457908682882255, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.00013419496972284081}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.0019627628749802942, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0005482087057123049}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.0017131282019251252, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0005120016166906651}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.0017821424924565805, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0005116719884636547}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.0022448445249864724, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0006188549077092995}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.001918332943289463, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0005536248619504823}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.0020181296932120095, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0005652424749866139}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 4.750583931400068e-39, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 8.063749129795418e-34}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b28bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b28bc4seed1/evaluation/generation/examples.4b284b28bc4seed1_GEM-web_nlg_en_PALM_prompt_0.jsonl b/4b284b28bc4seed1/evaluation/generation/examples.4b284b28bc4seed1_GEM-web_nlg_en_PALM_prompt_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..440967b9931f4f63d539b59507ba44d20b59c202 --- /dev/null +++ b/4b284b28bc4seed1/evaluation/generation/examples.4b284b28bc4seed1_GEM-web_nlg_en_PALM_prompt_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a2b18086f9956d5234b45ce844dd01d7d174582c1bade83ca7bcbb0256e17dd4 +size 4118889 diff --git a/4b284b28bc4seed1/evaluation/generation/examples.4b284b28bc4seed1_GEM-web_nlg_en_PALM_prompt_1.jsonl b/4b284b28bc4seed1/evaluation/generation/examples.4b284b28bc4seed1_GEM-web_nlg_en_PALM_prompt_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..5f166c2f49c3b4b9b6a65503789d7e81b712fe9c --- /dev/null +++ b/4b284b28bc4seed1/evaluation/generation/examples.4b284b28bc4seed1_GEM-web_nlg_en_PALM_prompt_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8582c69a94d9214076f76cb72251f60254083b079012c9a43d51cd1278e08d16 +size 5063208 diff --git a/4b284b28bc4seed1/evaluation/generation/examples.4b284b28bc4seed1_GEM-web_nlg_en_PALM_prompt_2.jsonl b/4b284b28bc4seed1/evaluation/generation/examples.4b284b28bc4seed1_GEM-web_nlg_en_PALM_prompt_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..6cce8c41da45af7e2abf29ab02a330e8a204b46a --- /dev/null +++ b/4b284b28bc4seed1/evaluation/generation/examples.4b284b28bc4seed1_GEM-web_nlg_en_PALM_prompt_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:37613a097b4d539d989c7f3fdae6e2cb9c56945f9332bed946d150c4c98045ed +size 6001051 diff --git a/4b284b28bc4seed1/evaluation/generation/examples.4b284b28bc4seed1_GEM-web_nlg_en_PALM_prompt_3.jsonl b/4b284b28bc4seed1/evaluation/generation/examples.4b284b28bc4seed1_GEM-web_nlg_en_PALM_prompt_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..0e414965e058b12f9ce86a8dcbd4fd329f2b7fd3 --- /dev/null +++ b/4b284b28bc4seed1/evaluation/generation/examples.4b284b28bc4seed1_GEM-web_nlg_en_PALM_prompt_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a04aab481d3f41eafc30e5e84bef6a029fa8b9e9e32830b2d8ee0c11af4ffc0 +size 6946105 diff --git a/4b284b28bc4seed1/evaluation/generation/examples.4b284b28bc4seed1_GEM-web_nlg_en_PALM_prompt_4.jsonl b/4b284b28bc4seed1/evaluation/generation/examples.4b284b28bc4seed1_GEM-web_nlg_en_PALM_prompt_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..81965ba406aac50ed95894a269a0f6790bb9970a --- /dev/null +++ b/4b284b28bc4seed1/evaluation/generation/examples.4b284b28bc4seed1_GEM-web_nlg_en_PALM_prompt_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:04f8342775627473602ca976f7265598a11c8994004b629f1011224c8da2579d +size 7853382 diff --git a/4b284b28bc4seed1/evaluation/generation/examples.4b284b28bc4seed1_GEM-web_nlg_en_PALM_prompt_5.jsonl b/4b284b28bc4seed1/evaluation/generation/examples.4b284b28bc4seed1_GEM-web_nlg_en_PALM_prompt_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..bab0f97b1d19d22c42475627de7da9cf062b97d6 --- /dev/null +++ b/4b284b28bc4seed1/evaluation/generation/examples.4b284b28bc4seed1_GEM-web_nlg_en_PALM_prompt_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:640c23709d7db9aa4338d06c57a93bc3468a3baf8aa6d60f2519c1ff9ddc8645 +size 8777008 diff --git a/4b284b28bc4seed1/evaluation/generation/examples.4b284b28bc4seed1_GEM-wiki_lingua_en_tldr_en_0.jsonl b/4b284b28bc4seed1/evaluation/generation/examples.4b284b28bc4seed1_GEM-wiki_lingua_en_tldr_en_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..dd349bc8642777cbf826ab860c94d4df4b64bf20 --- /dev/null +++ b/4b284b28bc4seed1/evaluation/generation/examples.4b284b28bc4seed1_GEM-wiki_lingua_en_tldr_en_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ef5519e6eaea810aa454d64adfdbc4cbea818d57383287f9bd2496ef3ab6a6f +size 7705557 diff --git a/4b284b28bc4seed1/evaluation/generation/examples.4b284b28bc4seed1_GEM-wiki_lingua_en_tldr_en_1.jsonl b/4b284b28bc4seed1/evaluation/generation/examples.4b284b28bc4seed1_GEM-wiki_lingua_en_tldr_en_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..4b3a8774e00d29461bd700163e5c7ed7511286b6 --- /dev/null +++ b/4b284b28bc4seed1/evaluation/generation/examples.4b284b28bc4seed1_GEM-wiki_lingua_en_tldr_en_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd5aa4072b20e2ade08b182d172079d44b57775b757bdce244b0de57a812e98f +size 13309286 diff --git a/4b284b28bc4seed1/evaluation/generation/examples.4b284b28bc4seed1_GEM-wiki_lingua_en_tldr_en_2.jsonl b/4b284b28bc4seed1/evaluation/generation/examples.4b284b28bc4seed1_GEM-wiki_lingua_en_tldr_en_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..8e41ea519ffbc1ad5a7524d081866f13da9c3c5c --- /dev/null +++ b/4b284b28bc4seed1/evaluation/generation/examples.4b284b28bc4seed1_GEM-wiki_lingua_en_tldr_en_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:94b5b29565f3540a5caafc13fd3f8230897477b6f4336b8e2064ce184e471390 +size 18900724 diff --git a/4b284b28bc4seed1/evaluation/generation/examples.4b284b28bc4seed1_GEM-wiki_lingua_en_tldr_en_3.jsonl b/4b284b28bc4seed1/evaluation/generation/examples.4b284b28bc4seed1_GEM-wiki_lingua_en_tldr_en_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..5dadf6823c792b2668bc4e0eb1187fbe7968faea --- /dev/null +++ b/4b284b28bc4seed1/evaluation/generation/examples.4b284b28bc4seed1_GEM-wiki_lingua_en_tldr_en_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4410b8804f57b48298b2c935f00bd0c2a80b76068d92bf6b436680f251bc195f +size 24314614 diff --git a/4b284b28bc4seed1/evaluation/generation/examples.4b284b28bc4seed1_GEM-wiki_lingua_en_tldr_en_4.jsonl b/4b284b28bc4seed1/evaluation/generation/examples.4b284b28bc4seed1_GEM-wiki_lingua_en_tldr_en_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..75b7196fc2bbe96ed93dde9de13f46ab96a22172 --- /dev/null +++ b/4b284b28bc4seed1/evaluation/generation/examples.4b284b28bc4seed1_GEM-wiki_lingua_en_tldr_en_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:726ecb390bb836e072861e432b712c134f6ec46096163db538cc11dec62e52cc +size 29462880 diff --git a/4b284b28bc4seed1/evaluation/generation/examples.4b284b28bc4seed1_GEM-wiki_lingua_en_tldr_en_5.jsonl b/4b284b28bc4seed1/evaluation/generation/examples.4b284b28bc4seed1_GEM-wiki_lingua_en_tldr_en_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..8b574222f0857177c49ca10ea5f578bb2919de20 --- /dev/null +++ b/4b284b28bc4seed1/evaluation/generation/examples.4b284b28bc4seed1_GEM-wiki_lingua_en_tldr_en_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ad16a49886b797d68996a898c53aa3f06b0ce465c7bd579044f9e31afb1576e +size 34797980 diff --git a/4b284b28bc4seed1/evaluation/generation/examples.4b284b28bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl b/4b284b28bc4seed1/evaluation/generation/examples.4b284b28bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..4bffa11c921a666c52021c1c8250c0942586ce07 --- /dev/null +++ b/4b284b28bc4seed1/evaluation/generation/examples.4b284b28bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d850d064e35bea00467fbc018132115d11abb1ae17458fd16de4edb82b44dc8 +size 3895782 diff --git a/4b284b28bc4seed1/evaluation/generation/examples.4b284b28bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl b/4b284b28bc4seed1/evaluation/generation/examples.4b284b28bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..ec36a6c5fda1384140dabee6182695fd1b146358 --- /dev/null +++ b/4b284b28bc4seed1/evaluation/generation/examples.4b284b28bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:221bb095a395d862cd2ed63b83ad4bbac5f1be999b1565ad28819b822001ba91 +size 5021331 diff --git a/4b284b28bc4seed1/evaluation/generation/examples.4b284b28bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl b/4b284b28bc4seed1/evaluation/generation/examples.4b284b28bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..8daaa8f05b3f10e25c69e12fbf5848f5dff762ab --- /dev/null +++ b/4b284b28bc4seed1/evaluation/generation/examples.4b284b28bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:560d61e8c62049f60a67652ce2f2fefa3436818bd1c9f5971b7f16d9a2c94bca +size 6098780 diff --git a/4b284b28bc4seed1/evaluation/generation/examples.4b284b28bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl b/4b284b28bc4seed1/evaluation/generation/examples.4b284b28bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..6701ed60f6dfa1f246f77ef2782f8d3bf1d6edb9 --- /dev/null +++ b/4b284b28bc4seed1/evaluation/generation/examples.4b284b28bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ffeea2f712a5d43a01a714f88cd0ec92eb570e3b796f60d5eb8bc8f0d170f0f7 +size 7184980 diff --git a/4b284b28bc4seed1/evaluation/generation/examples.4b284b28bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl b/4b284b28bc4seed1/evaluation/generation/examples.4b284b28bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..8fed0b4a743d5573b592bf3f61ee248aa369fae0 --- /dev/null +++ b/4b284b28bc4seed1/evaluation/generation/examples.4b284b28bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4be8cab1a5c9d9b73f552be25852b52d4459de53bc9f7deb47e7ffed6da75ae3 +size 8257644 diff --git a/4b284b28bc4seed1/evaluation/generation/examples.4b284b28bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl b/4b284b28bc4seed1/evaluation/generation/examples.4b284b28bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..638f0f5ab865b911427a2d1b0a7fde351bb017a9 --- /dev/null +++ b/4b284b28bc4seed1/evaluation/generation/examples.4b284b28bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2318be9c80d0d3e23ebf9a1d9a0045008190880c8c8da947db79ede8ed032a37 +size 9349490 diff --git a/4b284b28bc4seed1/evaluation/generation/examples.4b284b28bc4seed1_gem_xsum_article_DOC_summary_0.jsonl b/4b284b28bc4seed1/evaluation/generation/examples.4b284b28bc4seed1_gem_xsum_article_DOC_summary_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..3695e7924167b51693afbcbc5e1641698aea0018 --- /dev/null +++ b/4b284b28bc4seed1/evaluation/generation/examples.4b284b28bc4seed1_gem_xsum_article_DOC_summary_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7bbdb384e3734de5965d2ea8e913ac52afa52553ad1c460ae752ae7b5ad2b2f8 +size 2800426 diff --git a/4b284b28bc4seed1/evaluation/generation/examples.4b284b28bc4seed1_gem_xsum_article_DOC_summary_1.jsonl b/4b284b28bc4seed1/evaluation/generation/examples.4b284b28bc4seed1_gem_xsum_article_DOC_summary_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e52b6f6fc5f9fe0692a21c88017755c4525d85a1 --- /dev/null +++ b/4b284b28bc4seed1/evaluation/generation/examples.4b284b28bc4seed1_gem_xsum_article_DOC_summary_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5839e93a69cd0694c7fe7d8890e9012d8280a42dd23c48963e59e82a34d9ffae +size 5102739 diff --git a/4b284b28bc4seed1/evaluation/generation/examples.4b284b28bc4seed1_gem_xsum_article_DOC_summary_2.jsonl b/4b284b28bc4seed1/evaluation/generation/examples.4b284b28bc4seed1_gem_xsum_article_DOC_summary_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..069d2903c6ed15f7bdb32f618b84dfc0fce51f60 --- /dev/null +++ b/4b284b28bc4seed1/evaluation/generation/examples.4b284b28bc4seed1_gem_xsum_article_DOC_summary_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e4789e7ece61b840f1b98a4bbc2af0a6d6e199c09b9a834958d571079f8f27c7 +size 7376442 diff --git a/4b284b28bc4seed1/evaluation/generation/examples.4b284b28bc4seed1_gem_xsum_article_DOC_summary_3.jsonl b/4b284b28bc4seed1/evaluation/generation/examples.4b284b28bc4seed1_gem_xsum_article_DOC_summary_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e75f3e440b136826bd54e4f54c867f7290c5eed7 --- /dev/null +++ b/4b284b28bc4seed1/evaluation/generation/examples.4b284b28bc4seed1_gem_xsum_article_DOC_summary_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e44a762d882baedf020ac0521262c3fc880bfe9a7ecba35e4f005f4ccc5335f +size 9644200 diff --git a/4b284b28bc4seed1/evaluation/generation/examples.4b284b28bc4seed1_gem_xsum_article_DOC_summary_4.jsonl b/4b284b28bc4seed1/evaluation/generation/examples.4b284b28bc4seed1_gem_xsum_article_DOC_summary_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..bb5b4ec4cb1ae78ff9b24fc6bdd8602b9e04c222 --- /dev/null +++ b/4b284b28bc4seed1/evaluation/generation/examples.4b284b28bc4seed1_gem_xsum_article_DOC_summary_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:293e6f0a3e3682345c718b024bf422f6878c227f8f07875556ecead454d6595d +size 11671008 diff --git a/4b284b28bc4seed1/evaluation/generation/examples.4b284b28bc4seed1_gem_xsum_article_DOC_summary_5.jsonl b/4b284b28bc4seed1/evaluation/generation/examples.4b284b28bc4seed1_gem_xsum_article_DOC_summary_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..d9f12ae91f508776c4804bb05d49265bbdd3c2b6 --- /dev/null +++ b/4b284b28bc4seed1/evaluation/generation/examples.4b284b28bc4seed1_gem_xsum_article_DOC_summary_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dcdec5e3529cb1544a7f62815f2dbc0f413dc5fee3474ebbc5bae23e11f131b7 +size 13897548 diff --git a/4b284b28bc4seed1/evaluation/generation/slim.4b284b28bc4seed1_GEM-web_nlg_en_PALM_prompt_0.json b/4b284b28bc4seed1/evaluation/generation/slim.4b284b28bc4seed1_GEM-web_nlg_en_PALM_prompt_0.json new file mode 100644 index 0000000000000000000000000000000000000000..d5ec7ce78206eedd42586e70ae5bb613fcd6f674 --- /dev/null +++ b/4b284b28bc4seed1/evaluation/generation/slim.4b284b28bc4seed1_GEM-web_nlg_en_PALM_prompt_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.37735446471481876, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.03627756616654335 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.0770951414018354, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0016045271434282637 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.32071402180605507, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.004605078296811788 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.11660803455743125, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.002092415000785059 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.036415277664524216, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0009758440561531726 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.15772225366490272, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0032080616090033745 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.05551128171851163, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0013139706655432171 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.07386003315833899, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0014481551839227544 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.3123826157382853, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0045001843968478835 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.11225387153032584, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0019226335441299288 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.07376812234473101, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0014993347968782623 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.3075886721444383, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004330300847827791 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.11169551049560707, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0019597969064310676 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b28bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b28bc4seed1/evaluation/generation/slim.4b284b28bc4seed1_GEM-web_nlg_en_PALM_prompt_1.json b/4b284b28bc4seed1/evaluation/generation/slim.4b284b28bc4seed1_GEM-web_nlg_en_PALM_prompt_1.json new file mode 100644 index 0000000000000000000000000000000000000000..62565a9cfd78781e6b3b85427152e245a5cc926f --- /dev/null +++ b/4b284b28bc4seed1/evaluation/generation/slim.4b284b28bc4seed1_GEM-web_nlg_en_PALM_prompt_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.5955492347128004, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.04098243772631065 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.08263899702993936, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.001483174937834192 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.4023666815632534, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.005245336574571597 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.12834095324411207, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0019248518716807731 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.039217284731154656, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0009170392495425271 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.20543752587672504, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.003913508994823848 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.061270467324873235, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0012492449538634826 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.07806911458526311, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.001322862559894183 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.3835240834246368, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004954856771984596 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.12158319023743391, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0017288009789448422 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.07810015746385479, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0013877161994542311 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.38024068911899445, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004835861426173133 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.12124370085382484, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0017887287009066164 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b28bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b28bc4seed1/evaluation/generation/slim.4b284b28bc4seed1_GEM-web_nlg_en_PALM_prompt_2.json b/4b284b28bc4seed1/evaluation/generation/slim.4b284b28bc4seed1_GEM-web_nlg_en_PALM_prompt_2.json new file mode 100644 index 0000000000000000000000000000000000000000..7f061d76b921ca78ebd708ccc982b25374573595 --- /dev/null +++ b/4b284b28bc4seed1/evaluation/generation/slim.4b284b28bc4seed1_GEM-web_nlg_en_PALM_prompt_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.6719567149622531, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.04451490063633614 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.08290888658614914, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0015350215758182237 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.4194244346322516, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.005283499761780351 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.12936180136586783, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.001954303430193513 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.03927899079960598, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0009493902598473397 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.214648184705714, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.004017055136123084 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.06151955178238632, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0012577473248259622 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.07707538779187502, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0013161012683531753 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.3915395709801734, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0048204418807369295 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.12064349526703928, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.001720033258665151 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.07820442311124796, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0013841071483193569 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.3953219549146526, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004864683263901412 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.12216673770750221, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.001800956219634565 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b28bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b28bc4seed1/evaluation/generation/slim.4b284b28bc4seed1_GEM-web_nlg_en_PALM_prompt_3.json b/4b284b28bc4seed1/evaluation/generation/slim.4b284b28bc4seed1_GEM-web_nlg_en_PALM_prompt_3.json new file mode 100644 index 0000000000000000000000000000000000000000..58a66ad63186c27fb4af745eed1d8f76ceda76a2 --- /dev/null +++ b/4b284b28bc4seed1/evaluation/generation/slim.4b284b28bc4seed1_GEM-web_nlg_en_PALM_prompt_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.7030429320938599, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.04228909607379892 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.07917967419538707, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0014240165968682841 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.42024267058618486, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.005232177743876596 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.12494961329088779, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.001871934588598472 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.03673571584796494, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0008485900852921835 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.21159361761560835, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.003896974137970697 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.05835931677377586, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.001172617966432863 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.07289709850715816, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.001220535361848458 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.3865171662156251, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004668856621947524 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.11519873729255874, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0016320470107472416 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.07468731684101934, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0013010266610264402 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.3950249369083203, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0047835320890464855 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.11782366546024012, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0017256698791084089 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b28bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b28bc4seed1/evaluation/generation/slim.4b284b28bc4seed1_GEM-web_nlg_en_PALM_prompt_4.json b/4b284b28bc4seed1/evaluation/generation/slim.4b284b28bc4seed1_GEM-web_nlg_en_PALM_prompt_4.json new file mode 100644 index 0000000000000000000000000000000000000000..e7abae5782e13dfc6f2129f95ed0c35414bcba46 --- /dev/null +++ b/4b284b28bc4seed1/evaluation/generation/slim.4b284b28bc4seed1_GEM-web_nlg_en_PALM_prompt_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.7009084921005813, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.05429101270641276 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.0787656137813602, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0014303284095470072 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.4198316942830002, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0051407465648353945 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.12409393489139078, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.001785975484122767 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.03711436336217505, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0009399506148593571 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.21491818852062866, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.003973307675575708 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.05863215249774496, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0011389709231231604 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.07260277037447828, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0012668906951770727 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.38573795956761925, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004591295339002268 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.11439156159112489, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0015688033893795825 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.0744525796262277, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0013359002532122982 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.3952770689440709, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004713626458568202 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.11724728813607507, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.001670529322751021 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b28bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b28bc4seed1/evaluation/generation/slim.4b284b28bc4seed1_GEM-web_nlg_en_PALM_prompt_5.json b/4b284b28bc4seed1/evaluation/generation/slim.4b284b28bc4seed1_GEM-web_nlg_en_PALM_prompt_5.json new file mode 100644 index 0000000000000000000000000000000000000000..d6b94ec4c26fe4bc38f5f12e713259156ad61c9c --- /dev/null +++ b/4b284b28bc4seed1/evaluation/generation/slim.4b284b28bc4seed1_GEM-web_nlg_en_PALM_prompt_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.7813605370790605, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.044236747351497484 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.07910701465761572, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0014814464979107673 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.42965787368823066, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.005259601751094787 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.12489900535257513, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.001892834896809631 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.03705119454588921, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0009271466855999936 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.2180047518637017, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.00400770350410333 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.058674755789965206, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0012025616483889573 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.07219818322662526, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0012976343736866773 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.3913465741327545, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004618454191060434 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.11391088630556961, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0016293445333007116 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.07484317706922312, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0014014602911312686 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.4051096507534578, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004862305392822499 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.11797028786316605, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0017753435966714796 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b28bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b28bc4seed1/evaluation/generation/slim.4b284b28bc4seed1_GEM-wiki_lingua_en_tldr_en_0.json b/4b284b28bc4seed1/evaluation/generation/slim.4b284b28bc4seed1_GEM-wiki_lingua_en_tldr_en_0.json new file mode 100644 index 0000000000000000000000000000000000000000..e318b97830c800e34eb1af12fb4e66f10c3f4925 --- /dev/null +++ b/4b284b28bc4seed1/evaluation/generation/slim.4b284b28bc4seed1_GEM-wiki_lingua_en_tldr_en_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.1472006912589573, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0018081532683583343 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.25280412679250724, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0027283406577109795 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.17278267579995407, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.001805309989869822 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.02800882087488719, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0007031555613566064 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.05161999521321001, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0014471575437312986 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.033403065447518296, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0008091708062643894 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.1151686636057282, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0012754431121468031 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.20439066404636233, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.002231774421791313 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.13668346985187405, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0013073897309746026 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.1342468034278481, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0016375746774704983 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.2313321529160814, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.002494421485097423 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.15765023763708086, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.001625669978151679 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 1.4207573221891459, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.060668680742149504 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b28bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b28bc4seed1/evaluation/generation/slim.4b284b28bc4seed1_GEM-wiki_lingua_en_tldr_en_1.json b/4b284b28bc4seed1/evaluation/generation/slim.4b284b28bc4seed1_GEM-wiki_lingua_en_tldr_en_1.json new file mode 100644 index 0000000000000000000000000000000000000000..ae5be09a1541b272bc371a671784b44b6281bfb6 --- /dev/null +++ b/4b284b28bc4seed1/evaluation/generation/slim.4b284b28bc4seed1_GEM-wiki_lingua_en_tldr_en_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.19794818451477075, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.002216007848664949 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.3284489945851762, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.002997251491577378 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.22635289032885908, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0019797732821072913 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.05003816092030399, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0010440179296527974 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.0863451197200493, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0018333871572600053 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.057255731342826154, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0010651766443270621 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.1385898377468809, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0015132970995651801 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.23662979084247882, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.002337708767980629 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.1592439241741607, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0013041393201605942 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.18480829497363066, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0020842494081539653 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.30748871703201347, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0028452982805044153 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.21134027415429807, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0018497593685481146 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 2.863520294428325, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.04821407211996815 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b28bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b28bc4seed1/evaluation/generation/slim.4b284b28bc4seed1_GEM-wiki_lingua_en_tldr_en_2.json b/4b284b28bc4seed1/evaluation/generation/slim.4b284b28bc4seed1_GEM-wiki_lingua_en_tldr_en_2.json new file mode 100644 index 0000000000000000000000000000000000000000..30031c10556f72b526790edda02aa4097c2d5605 --- /dev/null +++ b/4b284b28bc4seed1/evaluation/generation/slim.4b284b28bc4seed1_GEM-wiki_lingua_en_tldr_en_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.19406216075430627, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0022851568065445846 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.30801257358803485, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.002815672688199465 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.21621899679871145, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0018861785936639156 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.04969349334752031, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0012211667072253483 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.07912027885387732, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.001712170031568902 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.054139172220906376, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0010468476711488718 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.1390654173595737, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0016872675834548336 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.22587848754502876, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.002267886826339719 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.15514555559600926, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0013211824425543813 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.18238320998068505, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0021483718861069925 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.2906352040127194, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0026915444202120025 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.2033687466390169, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0017670650217538845 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 2.892049675027145, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.05098830000976219 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b28bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b28bc4seed1/evaluation/generation/slim.4b284b28bc4seed1_GEM-wiki_lingua_en_tldr_en_3.json b/4b284b28bc4seed1/evaluation/generation/slim.4b284b28bc4seed1_GEM-wiki_lingua_en_tldr_en_3.json new file mode 100644 index 0000000000000000000000000000000000000000..b533ac31ead11125a32cc125b3d1f972184352dc --- /dev/null +++ b/4b284b28bc4seed1/evaluation/generation/slim.4b284b28bc4seed1_GEM-wiki_lingua_en_tldr_en_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.17111604893495974, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.002666234365501737 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.25241562149299535, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0032749227911704902 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.18012746746417807, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.002211658008220921 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.04327701615115013, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.001228777572136881 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.06549662087884625, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0016995103815543647 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.04512193425646708, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0010254911232422685 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.12471745040277263, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0020684991761244493 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.18654805673867839, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.002583812297767984 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.13030697479391384, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0015820227940213536 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.16128332553163546, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0025338005143025694 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.23839128203771087, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.003113680952409177 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.1697095188842209, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0020776929681688918 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 2.9015609655711327, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.0731100382224477 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b28bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b28bc4seed1/evaluation/generation/slim.4b284b28bc4seed1_GEM-wiki_lingua_en_tldr_en_4.json b/4b284b28bc4seed1/evaluation/generation/slim.4b284b28bc4seed1_GEM-wiki_lingua_en_tldr_en_4.json new file mode 100644 index 0000000000000000000000000000000000000000..da195ad248cfe25498f060ebc9f21fa025feb84b --- /dev/null +++ b/4b284b28bc4seed1/evaluation/generation/slim.4b284b28bc4seed1_GEM-wiki_lingua_en_tldr_en_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.054570512553222275, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0021295344255454545 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.0795788085275046, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.002819526024958868 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.0547919221475693, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0018695427841614045 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.012963816979253771, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0008570339066074451 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.020089181351346234, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0011359068136854778 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.012956061411719485, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.000654310189300764 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.04143340245616873, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.001670845773969632 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.060916796276303795, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0022168298240763207 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.041080312014145574, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.001390509184087734 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.05115883129564417, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0020129461932352306 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.07453932183957888, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0026507114407709974 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.05125820536012792, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0017489799459199928 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 0.5498632715838676, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.04532412143006689 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b28bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b28bc4seed1/evaluation/generation/slim.4b284b28bc4seed1_GEM-wiki_lingua_en_tldr_en_5.json b/4b284b28bc4seed1/evaluation/generation/slim.4b284b28bc4seed1_GEM-wiki_lingua_en_tldr_en_5.json new file mode 100644 index 0000000000000000000000000000000000000000..a8e5329d8ec61439e7051d3b0014227027e8167a --- /dev/null +++ b/4b284b28bc4seed1/evaluation/generation/slim.4b284b28bc4seed1_GEM-wiki_lingua_en_tldr_en_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.009254019379187583, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0009687953589273818 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.012906851032002356, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0012462005287005372 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.009074928433158342, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0008689330426263544 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.0024187488668729984, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.00044284833188613796 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.0031816545395102693, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0004382892858640001 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.0022561594203614308, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.00031382246712575974 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.0070282827330193105, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0007783399245473895 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.009802719504705336, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0009814452084083668 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.006803875534069048, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0006705094104727261 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.008596891531763053, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0009017346586956089 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.012142210310286464, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0011816152654071754 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.00846353027326687, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0008128006829974675 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 7.095551523492589e-07, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 1.483647929837512e-06 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b28bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b28bc4seed1/evaluation/generation/slim.4b284b28bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_0.json b/4b284b28bc4seed1/evaluation/generation/slim.4b284b28bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_0.json new file mode 100644 index 0000000000000000000000000000000000000000..dcd907e88467a92989941606d0c7591d58b55a2e --- /dev/null +++ b/4b284b28bc4seed1/evaluation/generation/slim.4b284b28bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 0.4098344694476387, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.05659734906094685 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.08028081330149647, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0015384112652978448 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.04939996548808655, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0013089989862407679 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.048385938607711065, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0009554921914241868 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.0027541218407848736, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.00035092238584102253 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.0033678792789505574, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.00032239765676952145 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.0024384647317544604, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.00023457941137137737 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.07933411355241447, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0015031308017294464 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.04857484893118309, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0012730023314328899 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.0477602327181495, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0009369815165680327 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.07839335233527917, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0014996927491176875 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.04630917456025576, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0011796155371411761 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.046214076424090866, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0008828068716652509 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b28bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b28bc4seed1/evaluation/generation/slim.4b284b28bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_1.json b/4b284b28bc4seed1/evaluation/generation/slim.4b284b28bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_1.json new file mode 100644 index 0000000000000000000000000000000000000000..f11765a02fa2f9ed92d9c3f852d686788409cc30 --- /dev/null +++ b/4b284b28bc4seed1/evaluation/generation/slim.4b284b28bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 11.566579816189526, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.1008934461871328 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.5476584258558421, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.003456480736532219 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.41369520299915363, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0030436852499156355 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.44235732853210524, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0023941703294020514 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.26480819367826736, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.002815017462568761 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.1947916755785088, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0021369452000412747 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.2090655371625227, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0019982452977907856 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.40566221817688664, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.003117710931571736 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.30207439523525703, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0024361075306840673 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.3244139780407101, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0020695436330019803 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.4515596659057806, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.00330045757816753 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.3391748876129398, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.002736309734827984 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.3633576021387155, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0022990935361642674 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b28bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b28bc4seed1/evaluation/generation/slim.4b284b28bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_2.json b/4b284b28bc4seed1/evaluation/generation/slim.4b284b28bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_2.json new file mode 100644 index 0000000000000000000000000000000000000000..7d46bad90645c2a5a33a07ed3a5fd36dedb899c7 --- /dev/null +++ b/4b284b28bc4seed1/evaluation/generation/slim.4b284b28bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 13.388773838263758, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.15855873725678352 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.5789198401113218, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0034646581707259965 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.43386579914021006, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0028978275527303445 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.4668734222692764, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.002246846357740528 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.29695825419975175, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.003050205383079884 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.21537221020252503, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.002178321767423481 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.23283198535704958, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0020561178954031285 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.4435501207130385, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0033174896772021436 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.3283330300619082, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0024660245741253578 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.35447078432499324, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0021030174285698792 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.490510155822524, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.003436994721582442 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.3662609564143789, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0027327897367931055 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.39454340194994386, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0023023116088308807 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b28bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b28bc4seed1/evaluation/generation/slim.4b284b28bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_3.json b/4b284b28bc4seed1/evaluation/generation/slim.4b284b28bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_3.json new file mode 100644 index 0000000000000000000000000000000000000000..3216d60a48b7a1db237aebc4863017ff4c9aaec1 --- /dev/null +++ b/4b284b28bc4seed1/evaluation/generation/slim.4b284b28bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 14.332946272100804, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.18137970117023247 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.5793041287934014, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.003372992411703443 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.4438630375906513, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0029246450295944823 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.47410403700383463, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0022235093842193814 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.30259452883798293, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.002973225867205113 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.2262470005601965, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.002281252913319087 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.24214353888062579, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0020914337667352996 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.4446517195178283, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0032644622543037123 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.33699099215579725, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0025380393382758446 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.3610728360004429, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0021477160139884146 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.49295247754853494, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.003364958172666197 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.376746301427234, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0027787439904039756 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.4027299671398636, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.002308027196519871 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b28bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b28bc4seed1/evaluation/generation/slim.4b284b28bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_4.json b/4b284b28bc4seed1/evaluation/generation/slim.4b284b28bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_4.json new file mode 100644 index 0000000000000000000000000000000000000000..dc0f9c28096b2e60500dfcdc476045eb1175b687 --- /dev/null +++ b/4b284b28bc4seed1/evaluation/generation/slim.4b284b28bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 14.060665357528471, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.26445377512594503 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.5812217022092131, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0034309298270467957 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.43567025831059786, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.002843591723717016 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.4710196471035029, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.00223956317877308 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.3024182514661336, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.003059613249842079 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.22039519212546937, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0022450567626817208 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.2391776138295886, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.002129468559557926 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.44652148397509384, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.003277961495936333 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.33135080522129373, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0024514490127927014 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.3592882674955681, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.002128255611143205 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.4943861067221433, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.003406003991655421 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.3698962329844, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.002720553601988623 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.4001617252953104, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0023226135429815936 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b28bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b28bc4seed1/evaluation/generation/slim.4b284b28bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_5.json b/4b284b28bc4seed1/evaluation/generation/slim.4b284b28bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_5.json new file mode 100644 index 0000000000000000000000000000000000000000..bd302027b2f1866e9468f43cb22ce2fa609ad4da --- /dev/null +++ b/4b284b28bc4seed1/evaluation/generation/slim.4b284b28bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 14.308593309054016, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.14306952311664156 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.5775681396669916, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.003331795685464776 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.4402215693743334, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0027531550513425758 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.47488846126671874, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0021786011409350068 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.29979953949402255, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0029503967662262848 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.2224041099843757, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0021904880519093752 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.24094008936533884, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0020801259022813117 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.44250221759721664, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0031886562916719433 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.33425438519938394, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.002422039927744084 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.36154908902057886, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0021160968101490625 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.49255025128439295, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.003325987333005444 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.3748555131665994, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.002667744873458217 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.40460308229003333, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.002297073510569085 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b28bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b28bc4seed1/evaluation/generation/slim.4b284b28bc4seed1_gem_xsum_article_DOC_summary_0.json b/4b284b28bc4seed1/evaluation/generation/slim.4b284b28bc4seed1_gem_xsum_article_DOC_summary_0.json new file mode 100644 index 0000000000000000000000000000000000000000..c3217489aa1dbfe94f97adc692a70e68ca3d89f8 --- /dev/null +++ b/4b284b28bc4seed1/evaluation/generation/slim.4b284b28bc4seed1_gem_xsum_article_DOC_summary_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.1613424323587368, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.002278376950302783 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.3330533490420518, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.004383443983456259 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.2087853046997779, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0025328837093340183 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.03314422437427033, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0012522698778844542 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.07302060035369815, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0026623802488437657 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.043870150801107066, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0015541821908238338 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.12067382175182433, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0017342073690786556 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.25037736095962637, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0034248848896776688 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.1562890353716468, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0019283406025933057 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.12496312472870656, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.001832956489326573 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.2617586907885203, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0038506762926574915 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.16248318414135096, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0021310634283090322 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 1.9479708786806795, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.08014965365678729 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b28bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b28bc4seed1/evaluation/generation/slim.4b284b28bc4seed1_gem_xsum_article_DOC_summary_1.json b/4b284b28bc4seed1/evaluation/generation/slim.4b284b28bc4seed1_gem_xsum_article_DOC_summary_1.json new file mode 100644 index 0000000000000000000000000000000000000000..e42ac56abbe0e0458148180bb0724f53a91b126b --- /dev/null +++ b/4b284b28bc4seed1/evaluation/generation/slim.4b284b28bc4seed1_gem_xsum_article_DOC_summary_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.13272782271590566, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0018764384818534341 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.3267515350090506, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.004353020039146078 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.1865319266668177, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.002524634111297582 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.0286660681091914, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.001013349141668393 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.07362289198488865, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.002707772359921043 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.04075132217381377, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0014397841016716487 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.10272547144552927, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0013800002526758255 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.25572197637104055, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.003442070323824128 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.14475331879083578, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0018814005333497661 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.10462377645973141, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0015282810270458372 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.260731647450524, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0038051114474756866 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.14751402177418876, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0020984330928484275 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 1.6036382509204854, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.07096687163435135 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b28bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b28bc4seed1/evaluation/generation/slim.4b284b28bc4seed1_gem_xsum_article_DOC_summary_2.json b/4b284b28bc4seed1/evaluation/generation/slim.4b284b28bc4seed1_gem_xsum_article_DOC_summary_2.json new file mode 100644 index 0000000000000000000000000000000000000000..e5a22a5678ce735aa6926310a49c6a85730aed11 --- /dev/null +++ b/4b284b28bc4seed1/evaluation/generation/slim.4b284b28bc4seed1_gem_xsum_article_DOC_summary_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.13076052871501112, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0018792476759405042 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.3221325006706253, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.004397231507997294 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.18378435325514345, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.002535460776839407 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.02746291848253061, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0010036620622712227 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.07033120823579617, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.002679121665145769 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.038998510414389495, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0014233539161123735 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.10140981704363383, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0013659104358610527 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.2519770493702287, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.003389522634128558 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.14281263909344286, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0018586972576843518 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.10292716745077025, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.001493393265112054 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.2564707137279286, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0037227133454889715 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.14511393337009704, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0020497175410351316 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 1.5160558945216587, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.08240737955012244 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b28bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b28bc4seed1/evaluation/generation/slim.4b284b28bc4seed1_gem_xsum_article_DOC_summary_3.json b/4b284b28bc4seed1/evaluation/generation/slim.4b284b28bc4seed1_gem_xsum_article_DOC_summary_3.json new file mode 100644 index 0000000000000000000000000000000000000000..b71a33ff650b8491c376a1bda69df0613b378239 --- /dev/null +++ b/4b284b28bc4seed1/evaluation/generation/slim.4b284b28bc4seed1_gem_xsum_article_DOC_summary_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.12752846466949222, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.002107108659509441 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.30226873054413106, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.004603263404573647 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.1755472401383986, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0026658088779740008 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.02656552305156673, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0010143773775889025 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.06679540752654423, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0026398777724888113 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.03728687717351484, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0014073859223946697 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.09973634913453447, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0016065186547029968 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.2381694226551552, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.003581000725397854 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.1374413682741159, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0020025230497704035 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.10128532281127449, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0017234587079133783 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.242387646401674, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.003912550948546174 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.13972451850744902, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.002189941237196646 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 1.4838319001573719, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.096950687868892 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b28bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b28bc4seed1/evaluation/generation/slim.4b284b28bc4seed1_gem_xsum_article_DOC_summary_4.json b/4b284b28bc4seed1/evaluation/generation/slim.4b284b28bc4seed1_gem_xsum_article_DOC_summary_4.json new file mode 100644 index 0000000000000000000000000000000000000000..794fb6bfd8dbc3e9a295bfa9af9dfda67fea3a31 --- /dev/null +++ b/4b284b28bc4seed1/evaluation/generation/slim.4b284b28bc4seed1_gem_xsum_article_DOC_summary_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.04055839800057727, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.002477310590755891 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.075289351379979, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.004369683499123559 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.04778183046984643, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0026876876154109395 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.007387682998651727, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0006990296012429621 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.01658715369278413, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0015969348183973628 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.009890919687627312, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0009266580590961874 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.03201249080708822, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0020286497636226534 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.058963105965077874, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0034421636677800026 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.037129528917459374, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.002067815641725132 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.032870357769899584, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0020908192203781383 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.060477341143397076, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0035760110748676577 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.03818253053785788, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0021629296440312594 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 0.7569692825353468, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.08589568488878548 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b28bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b28bc4seed1/evaluation/generation/slim.4b284b28bc4seed1_gem_xsum_article_DOC_summary_5.json b/4b284b28bc4seed1/evaluation/generation/slim.4b284b28bc4seed1_gem_xsum_article_DOC_summary_5.json new file mode 100644 index 0000000000000000000000000000000000000000..d5da811479c6c717cb9cb15ff7952ab788b9bfe1 --- /dev/null +++ b/4b284b28bc4seed1/evaluation/generation/slim.4b284b28bc4seed1_gem_xsum_article_DOC_summary_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.0027310061588494907, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0007639869380554712 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.002278390688529166, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.000653161458483614 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.002428042108949549, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0006836828342851362 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.0002712711508493972, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.00014357866607635477 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.00022836178496555851, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.00012848868152370965 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.0002457908682882255, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.00013419496972284081 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.0019627628749802942, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0005482087057123049 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.0017131282019251252, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0005120016166906651 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.0017821424924565805, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0005116719884636547 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.0022448445249864724, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0006188549077092995 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.001918332943289463, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0005536248619504823 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.0020181296932120095, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0005652424749866139 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 4.750583931400068e-39, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 8.063749129795418e-34 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b28bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b28bc4seed1/evaluation/rankeval/4b284b28bc4seed1_0.json b/4b284b28bc4seed1/evaluation/rankeval/4b284b28bc4seed1_0.json new file mode 100644 index 0000000000000000000000000000000000000000..75343732033842b1fea79f981f5e728a7711897c --- /dev/null +++ b/4b284b28bc4seed1/evaluation/rankeval/4b284b28bc4seed1_0.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.326, + "acc_stderr": 0.014830507204541037 + }, + "anli_r2": { + "acc": 0.332, + "acc_stderr": 0.014899597242811476 + }, + "anli_r3": { + "acc": 0.35333333333333333, + "acc_stderr": 0.013804572162314932 + }, + "cb": { + "acc": 0.35714285714285715, + "acc_stderr": 0.0646095738380922, + "f1": 0.1920045045045045 + }, + "copa": { + "acc": 0.76, + "acc_stderr": 0.04292346959909283 + }, + "hellaswag": { + "acc": 0.4814777932682733, + "acc_stderr": 0.004986356526063966, + "acc_norm": 0.6333399721171081, + "acc_norm_stderr": 0.004809077205343496 + }, + "rte": { + "acc": 0.5631768953068592, + "acc_stderr": 0.029855247390314945 + }, + "winogrande": { + "acc": 0.5919494869771112, + "acc_stderr": 0.013812822643745027 + }, + "storycloze_2016": { + "acc": 0.7220737573490112, + "acc_stderr": 0.010359403651225856 + }, + "boolq": { + "acc": 0.6058103975535168, + "acc_stderr": 0.008546995661233635 + }, + "arc_easy": { + "acc": 0.5862794612794613, + "acc_stderr": 0.010105878530238132, + "acc_norm": 0.5168350168350169, + "acc_norm_stderr": 0.010253966261288895 + }, + "arc_challenge": { + "acc": 0.2713310580204778, + "acc_stderr": 0.012993807727545794, + "acc_norm": 0.30716723549488056, + "acc_norm_stderr": 0.013481034054980943 + }, + "sciq": { + "acc": 0.846, + "acc_stderr": 0.011419913065098704, + "acc_norm": 0.766, + "acc_norm_stderr": 0.01339490288966001 + }, + "piqa": { + "acc": 0.7421109902067464, + "acc_stderr": 0.01020695666205625, + "acc_norm": 0.7578890097932536, + "acc_norm_stderr": 0.009994371269104397 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b28bc4seed1/evaluation/rankeval/4b284b28bc4seed1_0_lm-eval_global_step80108_2023-02-15-11-04-03_0shots_backup.json b/4b284b28bc4seed1/evaluation/rankeval/4b284b28bc4seed1_0_lm-eval_global_step80108_2023-02-15-11-04-03_0shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..75343732033842b1fea79f981f5e728a7711897c --- /dev/null +++ b/4b284b28bc4seed1/evaluation/rankeval/4b284b28bc4seed1_0_lm-eval_global_step80108_2023-02-15-11-04-03_0shots_backup.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.326, + "acc_stderr": 0.014830507204541037 + }, + "anli_r2": { + "acc": 0.332, + "acc_stderr": 0.014899597242811476 + }, + "anli_r3": { + "acc": 0.35333333333333333, + "acc_stderr": 0.013804572162314932 + }, + "cb": { + "acc": 0.35714285714285715, + "acc_stderr": 0.0646095738380922, + "f1": 0.1920045045045045 + }, + "copa": { + "acc": 0.76, + "acc_stderr": 0.04292346959909283 + }, + "hellaswag": { + "acc": 0.4814777932682733, + "acc_stderr": 0.004986356526063966, + "acc_norm": 0.6333399721171081, + "acc_norm_stderr": 0.004809077205343496 + }, + "rte": { + "acc": 0.5631768953068592, + "acc_stderr": 0.029855247390314945 + }, + "winogrande": { + "acc": 0.5919494869771112, + "acc_stderr": 0.013812822643745027 + }, + "storycloze_2016": { + "acc": 0.7220737573490112, + "acc_stderr": 0.010359403651225856 + }, + "boolq": { + "acc": 0.6058103975535168, + "acc_stderr": 0.008546995661233635 + }, + "arc_easy": { + "acc": 0.5862794612794613, + "acc_stderr": 0.010105878530238132, + "acc_norm": 0.5168350168350169, + "acc_norm_stderr": 0.010253966261288895 + }, + "arc_challenge": { + "acc": 0.2713310580204778, + "acc_stderr": 0.012993807727545794, + "acc_norm": 0.30716723549488056, + "acc_norm_stderr": 0.013481034054980943 + }, + "sciq": { + "acc": 0.846, + "acc_stderr": 0.011419913065098704, + "acc_norm": 0.766, + "acc_norm_stderr": 0.01339490288966001 + }, + "piqa": { + "acc": 0.7421109902067464, + "acc_stderr": 0.01020695666205625, + "acc_norm": 0.7578890097932536, + "acc_norm_stderr": 0.009994371269104397 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b28bc4seed1/evaluation/rankeval/4b284b28bc4seed1_1.json b/4b284b28bc4seed1/evaluation/rankeval/4b284b28bc4seed1_1.json new file mode 100644 index 0000000000000000000000000000000000000000..9c204fb86901a4f1348481c91fb089d5edd307e5 --- /dev/null +++ b/4b284b28bc4seed1/evaluation/rankeval/4b284b28bc4seed1_1.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.329, + "acc_stderr": 0.014865395385928367 + }, + "anli_r2": { + "acc": 0.346, + "acc_stderr": 0.01505026612756444 + }, + "anli_r3": { + "acc": 0.3433333333333333, + "acc_stderr": 0.01371263383046586 + }, + "cb": { + "acc": 0.48214285714285715, + "acc_stderr": 0.06737697508644648, + "f1": 0.33543417366946776 + }, + "copa": { + "acc": 0.78, + "acc_stderr": 0.04163331998932262 + }, + "hellaswag": { + "acc": 0.47699661422027484, + "acc_stderr": 0.004984497871025248, + "acc_norm": 0.6310495917147978, + "acc_norm_stderr": 0.004815343349305197 + }, + "rte": { + "acc": 0.5306859205776173, + "acc_stderr": 0.030039730592197816 + }, + "winogrande": { + "acc": 0.5927387529597474, + "acc_stderr": 0.013808654122417855 + }, + "storycloze_2016": { + "acc": 0.711918760021379, + "acc_stderr": 0.010472537019822583 + }, + "boolq": { + "acc": 0.5957186544342508, + "acc_stderr": 0.008583313811372065 + }, + "arc_easy": { + "acc": 0.6136363636363636, + "acc_stderr": 0.00999129677815962, + "acc_norm": 0.5765993265993266, + "acc_norm_stderr": 0.01013867100528905 + }, + "arc_challenge": { + "acc": 0.2815699658703072, + "acc_stderr": 0.013143376735009031, + "acc_norm": 0.30887372013651876, + "acc_norm_stderr": 0.013501770929344 + }, + "sciq": { + "acc": 0.881, + "acc_stderr": 0.010244215145336662, + "acc_norm": 0.859, + "acc_norm_stderr": 0.011010914595992448 + }, + "piqa": { + "acc": 0.7470076169749728, + "acc_stderr": 0.01014288869886246, + "acc_norm": 0.7551686615886833, + "acc_norm_stderr": 0.010032309105568802 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b28bc4seed1/evaluation/rankeval/4b284b28bc4seed1_1_lm-eval_global_step80108_2023-02-15-11-04-03_1shots_backup.json b/4b284b28bc4seed1/evaluation/rankeval/4b284b28bc4seed1_1_lm-eval_global_step80108_2023-02-15-11-04-03_1shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..9c204fb86901a4f1348481c91fb089d5edd307e5 --- /dev/null +++ b/4b284b28bc4seed1/evaluation/rankeval/4b284b28bc4seed1_1_lm-eval_global_step80108_2023-02-15-11-04-03_1shots_backup.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.329, + "acc_stderr": 0.014865395385928367 + }, + "anli_r2": { + "acc": 0.346, + "acc_stderr": 0.01505026612756444 + }, + "anli_r3": { + "acc": 0.3433333333333333, + "acc_stderr": 0.01371263383046586 + }, + "cb": { + "acc": 0.48214285714285715, + "acc_stderr": 0.06737697508644648, + "f1": 0.33543417366946776 + }, + "copa": { + "acc": 0.78, + "acc_stderr": 0.04163331998932262 + }, + "hellaswag": { + "acc": 0.47699661422027484, + "acc_stderr": 0.004984497871025248, + "acc_norm": 0.6310495917147978, + "acc_norm_stderr": 0.004815343349305197 + }, + "rte": { + "acc": 0.5306859205776173, + "acc_stderr": 0.030039730592197816 + }, + "winogrande": { + "acc": 0.5927387529597474, + "acc_stderr": 0.013808654122417855 + }, + "storycloze_2016": { + "acc": 0.711918760021379, + "acc_stderr": 0.010472537019822583 + }, + "boolq": { + "acc": 0.5957186544342508, + "acc_stderr": 0.008583313811372065 + }, + "arc_easy": { + "acc": 0.6136363636363636, + "acc_stderr": 0.00999129677815962, + "acc_norm": 0.5765993265993266, + "acc_norm_stderr": 0.01013867100528905 + }, + "arc_challenge": { + "acc": 0.2815699658703072, + "acc_stderr": 0.013143376735009031, + "acc_norm": 0.30887372013651876, + "acc_norm_stderr": 0.013501770929344 + }, + "sciq": { + "acc": 0.881, + "acc_stderr": 0.010244215145336662, + "acc_norm": 0.859, + "acc_norm_stderr": 0.011010914595992448 + }, + "piqa": { + "acc": 0.7470076169749728, + "acc_stderr": 0.01014288869886246, + "acc_norm": 0.7551686615886833, + "acc_norm_stderr": 0.010032309105568802 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b28bc4seed1/evaluation/rankeval/4b284b28bc4seed1_2.json b/4b284b28bc4seed1/evaluation/rankeval/4b284b28bc4seed1_2.json new file mode 100644 index 0000000000000000000000000000000000000000..a0fe6746923f9316620b2f84affae1bde8b0c3b4 --- /dev/null +++ b/4b284b28bc4seed1/evaluation/rankeval/4b284b28bc4seed1_2.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.336, + "acc_stderr": 0.014944140233795023 + }, + "anli_r2": { + "acc": 0.339, + "acc_stderr": 0.014976758771620347 + }, + "anli_r3": { + "acc": 0.30916666666666665, + "acc_stderr": 0.013346684134591957 + }, + "cb": { + "acc": 0.42857142857142855, + "acc_stderr": 0.06672848092813058, + "f1": 0.3117283950617284 + }, + "copa": { + "acc": 0.75, + "acc_stderr": 0.04351941398892446 + }, + "hellaswag": { + "acc": 0.47759410476000796, + "acc_stderr": 0.004984768912326932, + "acc_norm": 0.6331408086038638, + "acc_norm_stderr": 0.0048096267236268425 + }, + "rte": { + "acc": 0.5451263537906137, + "acc_stderr": 0.029973636495415255 + }, + "winogrande": { + "acc": 0.5951065509076559, + "acc_stderr": 0.013795927003124939 + }, + "storycloze_2016": { + "acc": 0.7199358631747729, + "acc_stderr": 0.01038376499392048 + }, + "boolq": { + "acc": 0.6131498470948012, + "acc_stderr": 0.008518188340844743 + }, + "arc_easy": { + "acc": 0.6224747474747475, + "acc_stderr": 0.009947227833469432, + "acc_norm": 0.601010101010101, + "acc_norm_stderr": 0.010048240683798743 + }, + "arc_challenge": { + "acc": 0.28754266211604096, + "acc_stderr": 0.01322671905626613, + "acc_norm": 0.31569965870307165, + "acc_norm_stderr": 0.013582571095815291 + }, + "sciq": { + "acc": 0.895, + "acc_stderr": 0.009698921026024964, + "acc_norm": 0.881, + "acc_norm_stderr": 0.010244215145336664 + }, + "piqa": { + "acc": 0.750816104461371, + "acc_stderr": 0.010091882770120214, + "acc_norm": 0.7600652883569097, + "acc_norm_stderr": 0.009963625892809545 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b28bc4seed1/evaluation/rankeval/4b284b28bc4seed1_2_lm-eval_global_step80108_2023-02-15-11-04-01_2shots_backup.json b/4b284b28bc4seed1/evaluation/rankeval/4b284b28bc4seed1_2_lm-eval_global_step80108_2023-02-15-11-04-01_2shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..a0fe6746923f9316620b2f84affae1bde8b0c3b4 --- /dev/null +++ b/4b284b28bc4seed1/evaluation/rankeval/4b284b28bc4seed1_2_lm-eval_global_step80108_2023-02-15-11-04-01_2shots_backup.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.336, + "acc_stderr": 0.014944140233795023 + }, + "anli_r2": { + "acc": 0.339, + "acc_stderr": 0.014976758771620347 + }, + "anli_r3": { + "acc": 0.30916666666666665, + "acc_stderr": 0.013346684134591957 + }, + "cb": { + "acc": 0.42857142857142855, + "acc_stderr": 0.06672848092813058, + "f1": 0.3117283950617284 + }, + "copa": { + "acc": 0.75, + "acc_stderr": 0.04351941398892446 + }, + "hellaswag": { + "acc": 0.47759410476000796, + "acc_stderr": 0.004984768912326932, + "acc_norm": 0.6331408086038638, + "acc_norm_stderr": 0.0048096267236268425 + }, + "rte": { + "acc": 0.5451263537906137, + "acc_stderr": 0.029973636495415255 + }, + "winogrande": { + "acc": 0.5951065509076559, + "acc_stderr": 0.013795927003124939 + }, + "storycloze_2016": { + "acc": 0.7199358631747729, + "acc_stderr": 0.01038376499392048 + }, + "boolq": { + "acc": 0.6131498470948012, + "acc_stderr": 0.008518188340844743 + }, + "arc_easy": { + "acc": 0.6224747474747475, + "acc_stderr": 0.009947227833469432, + "acc_norm": 0.601010101010101, + "acc_norm_stderr": 0.010048240683798743 + }, + "arc_challenge": { + "acc": 0.28754266211604096, + "acc_stderr": 0.01322671905626613, + "acc_norm": 0.31569965870307165, + "acc_norm_stderr": 0.013582571095815291 + }, + "sciq": { + "acc": 0.895, + "acc_stderr": 0.009698921026024964, + "acc_norm": 0.881, + "acc_norm_stderr": 0.010244215145336664 + }, + "piqa": { + "acc": 0.750816104461371, + "acc_stderr": 0.010091882770120214, + "acc_norm": 0.7600652883569097, + "acc_norm_stderr": 0.009963625892809545 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b28bc4seed1/evaluation/rankeval/4b284b28bc4seed1_3.json b/4b284b28bc4seed1/evaluation/rankeval/4b284b28bc4seed1_3.json new file mode 100644 index 0000000000000000000000000000000000000000..042d813d0855c313e4c26b99fb9e12f0bedf62eb --- /dev/null +++ b/4b284b28bc4seed1/evaluation/rankeval/4b284b28bc4seed1_3.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.331, + "acc_stderr": 0.014888272588203933 + }, + "anli_r2": { + "acc": 0.313, + "acc_stderr": 0.014671272822977888 + }, + "anli_r3": { + "acc": 0.3433333333333333, + "acc_stderr": 0.01371263383046586 + }, + "cb": { + "acc": 0.35714285714285715, + "acc_stderr": 0.06460957383809218, + "f1": 0.26080246913580246 + }, + "copa": { + "acc": 0.75, + "acc_stderr": 0.04351941398892446 + }, + "hellaswag": { + "acc": 0.47769368651663013, + "acc_stderr": 0.004984813391016206, + "acc_norm": 0.6324437363075085, + "acc_norm_stderr": 0.004811543077792729 + }, + "rte": { + "acc": 0.5703971119133574, + "acc_stderr": 0.02979666882912467 + }, + "winogrande": { + "acc": 0.5777426992896606, + "acc_stderr": 0.013881582030658543 + }, + "storycloze_2016": { + "acc": 0.7231427044361304, + "acc_stderr": 0.01034711289027693 + }, + "boolq": { + "acc": 0.617125382262997, + "acc_stderr": 0.008501734385335954 + }, + "arc_easy": { + "acc": 0.6212121212121212, + "acc_stderr": 0.009953737656542037, + "acc_norm": 0.6153198653198653, + "acc_norm_stderr": 0.009983171707008999 + }, + "arc_challenge": { + "acc": 0.2841296928327645, + "acc_stderr": 0.013179442447653887, + "acc_norm": 0.3174061433447099, + "acc_norm_stderr": 0.01360223908803817 + }, + "sciq": { + "acc": 0.905, + "acc_stderr": 0.009276910103103306, + "acc_norm": 0.893, + "acc_norm_stderr": 0.009779910359847167 + }, + "piqa": { + "acc": 0.7464635473340587, + "acc_stderr": 0.010150090834551786, + "acc_norm": 0.7589771490750816, + "acc_norm_stderr": 0.009979042717267314 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b28bc4seed1/evaluation/rankeval/4b284b28bc4seed1_3_lm-eval_global_step80108_2023-02-15-11-04-03_3shots_backup.json b/4b284b28bc4seed1/evaluation/rankeval/4b284b28bc4seed1_3_lm-eval_global_step80108_2023-02-15-11-04-03_3shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..042d813d0855c313e4c26b99fb9e12f0bedf62eb --- /dev/null +++ b/4b284b28bc4seed1/evaluation/rankeval/4b284b28bc4seed1_3_lm-eval_global_step80108_2023-02-15-11-04-03_3shots_backup.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.331, + "acc_stderr": 0.014888272588203933 + }, + "anli_r2": { + "acc": 0.313, + "acc_stderr": 0.014671272822977888 + }, + "anli_r3": { + "acc": 0.3433333333333333, + "acc_stderr": 0.01371263383046586 + }, + "cb": { + "acc": 0.35714285714285715, + "acc_stderr": 0.06460957383809218, + "f1": 0.26080246913580246 + }, + "copa": { + "acc": 0.75, + "acc_stderr": 0.04351941398892446 + }, + "hellaswag": { + "acc": 0.47769368651663013, + "acc_stderr": 0.004984813391016206, + "acc_norm": 0.6324437363075085, + "acc_norm_stderr": 0.004811543077792729 + }, + "rte": { + "acc": 0.5703971119133574, + "acc_stderr": 0.02979666882912467 + }, + "winogrande": { + "acc": 0.5777426992896606, + "acc_stderr": 0.013881582030658543 + }, + "storycloze_2016": { + "acc": 0.7231427044361304, + "acc_stderr": 0.01034711289027693 + }, + "boolq": { + "acc": 0.617125382262997, + "acc_stderr": 0.008501734385335954 + }, + "arc_easy": { + "acc": 0.6212121212121212, + "acc_stderr": 0.009953737656542037, + "acc_norm": 0.6153198653198653, + "acc_norm_stderr": 0.009983171707008999 + }, + "arc_challenge": { + "acc": 0.2841296928327645, + "acc_stderr": 0.013179442447653887, + "acc_norm": 0.3174061433447099, + "acc_norm_stderr": 0.01360223908803817 + }, + "sciq": { + "acc": 0.905, + "acc_stderr": 0.009276910103103306, + "acc_norm": 0.893, + "acc_norm_stderr": 0.009779910359847167 + }, + "piqa": { + "acc": 0.7464635473340587, + "acc_stderr": 0.010150090834551786, + "acc_norm": 0.7589771490750816, + "acc_norm_stderr": 0.009979042717267314 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b28bc4seed1/evaluation/rankeval/4b284b28bc4seed1_4.json b/4b284b28bc4seed1/evaluation/rankeval/4b284b28bc4seed1_4.json new file mode 100644 index 0000000000000000000000000000000000000000..1cdb7f5459c0d00d99a81b214f70d0d272293da1 --- /dev/null +++ b/4b284b28bc4seed1/evaluation/rankeval/4b284b28bc4seed1_4.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.339, + "acc_stderr": 0.014976758771620335 + }, + "anli_r2": { + "acc": 0.342, + "acc_stderr": 0.01500870618212173 + }, + "anli_r3": { + "acc": 0.3333333333333333, + "acc_stderr": 0.0136139500102256 + }, + "cb": { + "acc": 0.5, + "acc_stderr": 0.06741998624632421, + "f1": 0.35582970488630866 + }, + "copa": { + "acc": 0.8, + "acc_stderr": 0.040201512610368445 + }, + "hellaswag": { + "acc": 0.4758016331408086, + "acc_stderr": 0.004983934343250461, + "acc_norm": 0.6377215694084843, + "acc_norm_stderr": 0.004796763521045232 + }, + "rte": { + "acc": 0.5342960288808665, + "acc_stderr": 0.030025579819366422 + }, + "winogrande": { + "acc": 0.5911602209944752, + "acc_stderr": 0.013816954295135688 + }, + "storycloze_2016": { + "acc": 0.7226082308925709, + "acc_stderr": 0.010353267472010775 + }, + "boolq": { + "acc": 0.6250764525993884, + "acc_stderr": 0.008467017704333002 + }, + "arc_easy": { + "acc": 0.6279461279461279, + "acc_stderr": 0.009918187193096466, + "acc_norm": 0.6132154882154882, + "acc_norm_stderr": 0.009993308355370965 + }, + "arc_challenge": { + "acc": 0.29692832764505117, + "acc_stderr": 0.013352025976725222, + "acc_norm": 0.33276450511945393, + "acc_norm_stderr": 0.013769863046192312 + }, + "sciq": { + "acc": 0.901, + "acc_stderr": 0.009449248027662744, + "acc_norm": 0.892, + "acc_norm_stderr": 0.009820001651345705 + }, + "piqa": { + "acc": 0.7464635473340587, + "acc_stderr": 0.010150090834551791, + "acc_norm": 0.7584330794341676, + "acc_norm_stderr": 0.009986718001804456 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b28bc4seed1/evaluation/rankeval/4b284b28bc4seed1_4_lm-eval_global_step80108_2023-02-15-11-04-02_4shots_backup.json b/4b284b28bc4seed1/evaluation/rankeval/4b284b28bc4seed1_4_lm-eval_global_step80108_2023-02-15-11-04-02_4shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..1cdb7f5459c0d00d99a81b214f70d0d272293da1 --- /dev/null +++ b/4b284b28bc4seed1/evaluation/rankeval/4b284b28bc4seed1_4_lm-eval_global_step80108_2023-02-15-11-04-02_4shots_backup.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.339, + "acc_stderr": 0.014976758771620335 + }, + "anli_r2": { + "acc": 0.342, + "acc_stderr": 0.01500870618212173 + }, + "anli_r3": { + "acc": 0.3333333333333333, + "acc_stderr": 0.0136139500102256 + }, + "cb": { + "acc": 0.5, + "acc_stderr": 0.06741998624632421, + "f1": 0.35582970488630866 + }, + "copa": { + "acc": 0.8, + "acc_stderr": 0.040201512610368445 + }, + "hellaswag": { + "acc": 0.4758016331408086, + "acc_stderr": 0.004983934343250461, + "acc_norm": 0.6377215694084843, + "acc_norm_stderr": 0.004796763521045232 + }, + "rte": { + "acc": 0.5342960288808665, + "acc_stderr": 0.030025579819366422 + }, + "winogrande": { + "acc": 0.5911602209944752, + "acc_stderr": 0.013816954295135688 + }, + "storycloze_2016": { + "acc": 0.7226082308925709, + "acc_stderr": 0.010353267472010775 + }, + "boolq": { + "acc": 0.6250764525993884, + "acc_stderr": 0.008467017704333002 + }, + "arc_easy": { + "acc": 0.6279461279461279, + "acc_stderr": 0.009918187193096466, + "acc_norm": 0.6132154882154882, + "acc_norm_stderr": 0.009993308355370965 + }, + "arc_challenge": { + "acc": 0.29692832764505117, + "acc_stderr": 0.013352025976725222, + "acc_norm": 0.33276450511945393, + "acc_norm_stderr": 0.013769863046192312 + }, + "sciq": { + "acc": 0.901, + "acc_stderr": 0.009449248027662744, + "acc_norm": 0.892, + "acc_norm_stderr": 0.009820001651345705 + }, + "piqa": { + "acc": 0.7464635473340587, + "acc_stderr": 0.010150090834551791, + "acc_norm": 0.7584330794341676, + "acc_norm_stderr": 0.009986718001804456 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b28bc4seed1/evaluation/rankeval/4b284b28bc4seed1_5.json b/4b284b28bc4seed1/evaluation/rankeval/4b284b28bc4seed1_5.json new file mode 100644 index 0000000000000000000000000000000000000000..8716e16bc79e9fff0c05fdec9a73939f46f9fbdd --- /dev/null +++ b/4b284b28bc4seed1/evaluation/rankeval/4b284b28bc4seed1_5.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.346, + "acc_stderr": 0.015050266127564441 + }, + "anli_r2": { + "acc": 0.336, + "acc_stderr": 0.014944140233795027 + }, + "anli_r3": { + "acc": 0.32166666666666666, + "acc_stderr": 0.01349009528298952 + }, + "cb": { + "acc": 0.39285714285714285, + "acc_stderr": 0.0658538889806635, + "f1": 0.2872985170857511 + }, + "copa": { + "acc": 0.81, + "acc_stderr": 0.03942772444036623 + }, + "hellaswag": { + "acc": 0.476000796654053, + "acc_stderr": 0.0049840302505072915, + "acc_norm": 0.6396136227843059, + "acc_norm_stderr": 0.004791313101877042 + }, + "rte": { + "acc": 0.51985559566787, + "acc_stderr": 0.030072723167317177 + }, + "winogrande": { + "acc": 0.5887924230465666, + "acc_stderr": 0.013829128358676862 + }, + "storycloze_2016": { + "acc": 0.7268840192410476, + "acc_stderr": 0.010303512765124681 + }, + "boolq": { + "acc": 0.6238532110091743, + "acc_stderr": 0.008472516562330721 + }, + "arc_easy": { + "acc": 0.6338383838383839, + "acc_stderr": 0.009885391390947724, + "acc_norm": 0.6199494949494949, + "acc_norm_stderr": 0.009960175831493126 + }, + "arc_challenge": { + "acc": 0.29948805460750855, + "acc_stderr": 0.01338502163731357, + "acc_norm": 0.3216723549488055, + "acc_norm_stderr": 0.013650488084494164 + }, + "sciq": { + "acc": 0.909, + "acc_stderr": 0.009099549538400236, + "acc_norm": 0.901, + "acc_norm_stderr": 0.009449248027662734 + }, + "piqa": { + "acc": 0.7480957562568009, + "acc_stderr": 0.010128421335088683, + "acc_norm": 0.7568008705114254, + "acc_norm_stderr": 0.010009611953858917 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b28bc4seed1/evaluation/rankeval/4b284b28bc4seed1_5_lm-eval_global_step80108_2023-02-15-11-04-03_5shots_backup.json b/4b284b28bc4seed1/evaluation/rankeval/4b284b28bc4seed1_5_lm-eval_global_step80108_2023-02-15-11-04-03_5shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..8716e16bc79e9fff0c05fdec9a73939f46f9fbdd --- /dev/null +++ b/4b284b28bc4seed1/evaluation/rankeval/4b284b28bc4seed1_5_lm-eval_global_step80108_2023-02-15-11-04-03_5shots_backup.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.346, + "acc_stderr": 0.015050266127564441 + }, + "anli_r2": { + "acc": 0.336, + "acc_stderr": 0.014944140233795027 + }, + "anli_r3": { + "acc": 0.32166666666666666, + "acc_stderr": 0.01349009528298952 + }, + "cb": { + "acc": 0.39285714285714285, + "acc_stderr": 0.0658538889806635, + "f1": 0.2872985170857511 + }, + "copa": { + "acc": 0.81, + "acc_stderr": 0.03942772444036623 + }, + "hellaswag": { + "acc": 0.476000796654053, + "acc_stderr": 0.0049840302505072915, + "acc_norm": 0.6396136227843059, + "acc_norm_stderr": 0.004791313101877042 + }, + "rte": { + "acc": 0.51985559566787, + "acc_stderr": 0.030072723167317177 + }, + "winogrande": { + "acc": 0.5887924230465666, + "acc_stderr": 0.013829128358676862 + }, + "storycloze_2016": { + "acc": 0.7268840192410476, + "acc_stderr": 0.010303512765124681 + }, + "boolq": { + "acc": 0.6238532110091743, + "acc_stderr": 0.008472516562330721 + }, + "arc_easy": { + "acc": 0.6338383838383839, + "acc_stderr": 0.009885391390947724, + "acc_norm": 0.6199494949494949, + "acc_norm_stderr": 0.009960175831493126 + }, + "arc_challenge": { + "acc": 0.29948805460750855, + "acc_stderr": 0.01338502163731357, + "acc_norm": 0.3216723549488055, + "acc_norm_stderr": 0.013650488084494164 + }, + "sciq": { + "acc": 0.909, + "acc_stderr": 0.009099549538400236, + "acc_norm": 0.901, + "acc_norm_stderr": 0.009449248027662734 + }, + "piqa": { + "acc": 0.7480957562568009, + "acc_stderr": 0.010128421335088683, + "acc_norm": 0.7568008705114254, + "acc_norm_stderr": 0.010009611953858917 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7ad011fbbc1fba83cb41fe67646f44359f5abc94 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b016bf217a460371476b5d3385b61812935c0efeaddce70298f1decf48b2b247 +size 199058647 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e1a62f6bfae853750696e879941aaaadc856b5b6 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39a4eca43a0080b234df9aed7d0a22e04b52bcdf22db22d64f7deaa054c01246 +size 199058647 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fcc2502a63a09a99780f1d010b54f9e9087064ee --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e9dac50c2a6b46e67a11e023c1ed65962543aa73f953c7c198e905bba6059a31 +size 199058733 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..860ea0b0bdc90d50c2af34df612f4b1b78c3f872 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92db120f2a8f05cf41b7e576f5591fa20a620acd9b797cdc01ebe1abbeff7d7c +size 199058733 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2203344542027ad1d107f5a7af129bdb745f9368 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a3dec40345f1c8496b4f74feb32fdd28fa3d92030e668e46593eac455052f0c5 +size 199058797 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c53056749552659439c053c6164d5311032cd6ed --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:67b4539766cb90ebd9c36b117e12cce01aef1c23b1348c43a5f7caa0a822bdb0 +size 199058797 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0424e5d07936e91bd7252652d1f85933d806e7f4 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5395e8c95565eb004db3f475ec967c9b0c5e82ee217f58f7ebadf20a46b8ddcb +size 199058733 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..22c82da3d7ffb5221efe863358b6bee7f442754f --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe42ffff6d5c60e90a502cb6d14895e9afe8fa59fbac725bb12402cc200aaeac +size 199058733 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fc87440b02218eed75ce952e9120d8333f317e0b --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf628e01be9066dd88892a89e03fd6705430b6d93d08e1d29982243d1f5dea45 +size 199058733 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..108dd099ee84782d385d3b74f80b894ee864b83a --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:19564b40d519bcf55cffcb4e182527688ccd7ee782654d76af5f0367d0223041 +size 199058733 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e6d314855b882443615960dafcc497e9ad89556a --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d957e4104c4aa006c07512589b265805e5bca5d12d52bd8360e202f7082b274 +size 199058797 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7076a4b07e178d20ee7cc5a1a81225e8d361f268 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06d028ace4bc2a149c2ae2cf21c888ab6cff7d481db9692816a13148ee8ec17e +size 199058797 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0f2edb2494caf306cde3e0184cd710cd0a07007d --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b0cbfeb357ace31cfb60f9d85f8128248b5c70ae99dfe19bda906a41138ba93 +size 199058733 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fd3bf876906f15a21d91f7f08502567a0bc58bc1 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:748f0a9d77d71635439d4dc5a307971b8249a5af6b7f75c80768b071b84f5074 +size 199058733 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..da2ec102c506fb179e3816579320334a2689b0db --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:faa7bd7f475fcdce33467347a9141655710e069b35519d1afc793769fd62269b +size 199058669 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f49dcf0294352eed163f4ea6ae0fe3d5db5e5b36 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f42a5fa147192c2573b19fc21865f521f1cb33c56abd32d9749c7cb0d4e5b74 +size 199058669 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fde4e15e7816b4e4699d3d92c1752be24183b952 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f07ca7709a3afd760f684fd6a3d6ed1ac4544e2ac3c3213b909d55ca133212b +size 199058797 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dce75f9f56430d096f31ea41fff19a1446db3114 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c9d2391f993fd9b51640be83bbb80d375353c25e2fabfc4175d64be96894e93 +size 199058797 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..05b917a9ced3f16a6c69626dd289f41c198d635c --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:91e50ebc37ad6f605616d11dcda9ddb940fa87297ce68a789ab19767fead5a05 +size 199058733 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0e879e0fc21ef36cdfe920d5b25adcaafb6b4423 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:481adfe977330a88ef5f1e902c4bbfe92ba7c87375cd831fcf390b8127dc628e +size 199058733 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..97955480acd3bde99bc4c9271122f70b13209fcb --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a04f13d9f240814c9310725e7f6e89187da58d772caa2176f06353fe3af07270 +size 199058733 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6c90f0bf1e40640e74fc8578a006139ed62e6da7 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:525f36de1c943264231d40e8b0b6e0cd6fda108b06b104a5c75be806b8459739 +size 199058733 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3e41e941c0c009deaeaace8643f7a0a1c6988b5c --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d7a8b70c63cad22f3921109ae8ad0faba39b10cc5dc6ab685775410bd8d5cc76 +size 199058658 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9901c503e4de420916f34339ef1097999a19ee7e --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76ef770314636e8688ae77c31371e4dd3a21656eeaf7b76c1f78893df1a52247 +size 199058658 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..742c48b8ed5deef5cf5bd30237f730786c390ca8 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:65a6bc81d57296b391080305946a77c5332e9570499400682ea07ef1de9a840d +size 199058733 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1755e4f7e66762a268bcf3cfb3c6248813910bbc --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd114c66d9ca414752b84d130270579acf7ac5d5c196e279b2a1a5cc7b44cc3f +size 199058733 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..38b41b1ddd5d8209ab303d67b4a1c29087fd6ef1 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:201021eeed4b34cb20bc86677420b528d2eded3e42c6d47609d8b75177684e92 +size 199058797 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..eadc617177d782aaa0fe234c8a315a58cdefc428 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:95127b822dcae8fe74f25f6035775675e73fa88eec1aad28c620647aab2a478e +size 199058797 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a15e2fa7b84d3e6ea0a048e49feb732f766193f8 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bae2083a81c85b4cfd6d62c89f63171c3c1152bb3cd65c871f680c13372d4e5d +size 199058605 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2136b363b5822f5b91fd696b6a4e223e7b9727d2 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4051f63dea4dc51ccd8340731074e331b75ce49f5b3105ad3dfa545ee4e54eaf +size 199058605 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..46d7c6d467aa52b5995a453a46020f76d0d58333 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5cd1d4f60e91bde925dd9fef4b52f06d5b7054cfa4552f760c2a240b76a7ea2a +size 199058669 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fc1ee5a2617dd9fb7c9216bf75883d04a89ea793 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d2111c8db964c10eed03d692fdd54084e9a4d77467ef3be3d224a733638b8f82 +size 199058669 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2c7699261d55537efad3657d1760ec80ba9791cf --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c647179677825f39dbb49527727e575c82922627f48c8ab9d22e0048681ce452 +size 199058797 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f11ed86a966913c41573aaec49f887f45f90c45a --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5959ad55038ff457d6a9020b7c857bedeea86fe5fa969377a95b119379c9f2cb +size 199058797 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8c16c58a832faf786e932af15fad7faa6e9befb2 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eaa3338dd5b90c06ec4978e506e520cbf1adf54f70409937fc01f0bd95f11f04 +size 199058733 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0f92102958fee85c15f2c32ba748a06653f0d942 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:525a8a730c850b3a4d31cae318c74ca5aaab4c5b27aadcf61262e9a5dfb045dd +size 199058733 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..21dd36dd5c4f2129e33e316afe2294ed3ca92f74 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7abcfd3c00f37851da5e545019e3cb200173ca1b8ebe45d6602cf69138bca792 +size 199058733 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b84bc5b550d307c3e792e0c5037b356c966284a2 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d00b09704d1ec9359565500f775c8e91e28dde5cab79d6c68bbbf9adc36ea77 +size 199058733 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c7c33c3c0521070891c5149f42802522fe11f805 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:128bc9412fa45fce060f4a5892f9ffee5c1df50b8c73b975a8ee5393ca9b5b2c +size 199058733 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9d2b397ba064cb13eec834c794862c6ac541f0b8 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:65e76801b205f8178d7f5d93b039d1f95b4f23a5767e42a4d5cd315407821feb +size 199058733 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fd8acdf62d9196b05c5870198c7f958bb44d910b --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cbbce38eeb06944af097342e182246ebadd9d314fddfac22d95ea259382e04b6 +size 199058797 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c0e19e4350f17cfd1119beba3f212557ccfbad16 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02b1e07f0634de041267e805458b5f923197001a5ad89d15da85889bc8703937 +size 199058797 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9af039cdea9c38947e5d2971f6ebee01b3c38371 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d4d126d184021dc8475a9e50f2b11442ccc696fa56bd073c3b959aa620ed183 +size 199058669 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e9652489f2eaf30937f8c15409882c78bfc735c1 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e07f342df929d10a2ec99213dbef1d0289c87e9a56ad878a07486da7be2cc06e +size 199058669 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3fa9a5f30f60db15ed0d421cd8534c8c7b4dabf5 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:89a3f944d7f595a6aad5b92e4b23144c1aac73fe64b21f51fc2d7752e599d8bc +size 199058850 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4c7297280162d38bc78c7fb287ffcd3e9bea2709 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:30bf806e1e3e1ebe2bef17224b57f783d437606db83052dc52fcdc3a8eec8d50 +size 199058850 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6b6c5544f1a7d2dd8b4dcb637e2743056ae53cc8 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f9a460d67fa26a5fb2738d2ba05684fb5098973c76797fb1dc1cbf3dceacdd7f +size 199058669 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..65bb82cdf275189e39ad8f853b1b9a6fe78b2a96 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b77edebd9a05f3e960402d60783e162daeb3d29c22c274ae74f0a5a4e1f29141 +size 199058669 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c345ff7de29ba959707fdf49be65fc8788ddeda1 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2444d1c5633be070e633e23cb2d3d59479b1c2f7c83eb74cdc9432827c164f57 +size 199058797 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b35a66abd5434fd86d0d5578ea5347df06e03f46 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e18cc90f279f98869180d8603e8fe8334e47d67efdd76a7f0941679a51813df +size 199058797 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cf8ec6f2ced5063f268c3178d09edf3539f666a4 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2857b6ce9596c3e0b707d8c5b5efec2a121f4193cd5fd4cc1c308f169824e92d +size 199058733 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3031b8f37f44f81898b54d7ba4a74ea27a810e52 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:11d9f0bffe04acdec9b32489e15d353c68824d3edda042d91c757a292e581cc8 +size 199058733 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4a8f8d1c80a30539038b3fd7c2b2ea3d32b91653 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:55d10cc651665c3dbb7f7b6edec848313feec15d231cd2b7c1f3d4f7271605bd +size 199058733 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..aa2d531b4001ba11e006c356767907ac136bdb9b --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:68a3c16a55b00642b073efc66b016a1d7cc755af9855bdc41b2c77daf9dc3b53 +size 199058733 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d5ebab9a2218e007e259aee57f07ca6f85df925f --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d32dcd249e128b640072971fd26f33707c145ef551c38b670c3ea72a1682ad98 +size 199058669 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6b792a8928f8aea92844ebcd8a4b75cdde5b5e80 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3d26154eb393978c84022f2ea989d1914874a554816f0176b38d8672b29d785 +size 199058669 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..74131e646f02438e25270db169a1251b8f01a427 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2de3ff6783a9d371c61e0368fc21c0da8c3d19ad5a08df065c42f7dd1b10f0ed +size 199058925 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2fe62a510132c4838ff6104af74ac1beed4b3e5b --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eed669ad166d876b4bf1bfc61ed52a55d6d63895794cdcd9d07d93d85e3bed72 +size 199058925 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..14cf684ec3a43051f2ec7a095692a6b403eeb2cd --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6e0feda2986e218537dc1063aa9a6869afa7b1a44debffe275868b662ce5b8f +size 199058605 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f1939dbaafa7c2038959985a01f0cac837848a61 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d5d3cf3f9977011b947ac7399a8d84dbf7b41d9f464b21a870a209404a80a90 +size 199058605 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c82a59da273bd1989f070d2af1ece44f25036b26 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04427080bb07f98a187185f23be75d4b6bf71e0b38dd2edcf76ce6d71ff41be +size 199058605 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..072142a4580cf9fc9d4feb9e25a5bc8e225ced4c --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:65ef58773702dc2fd5283e8c00e0084b8424ef5e84a97e4469aa23794db6044b +size 199058605 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..def95efcefee48879950c9e37bdf44b0ec00d110 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:66040d1f57a69a3d3fbcef85ea2126155c80b991023de67e89974c5279c7df0b +size 199058722 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..932edf0b48c93014e9e2a74f274fe01cea902f62 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e04934248f5617566b4410a8622bbab541484fe5fb962e77b1198865d0299ffa +size 199058722 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..12c3248e89c2d1c74aa1f04fd451f6313f21b113 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5aef490d057820f07af3f70b16109951f1c7b6a87eb67a224e4da1496bd078ea +size 199058658 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fb962de6f195a9139c0fa4e8451279ef3194c395 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b634e9dc1f59dfbc3b60301796d8d8e85a259e399ff3af30618069026b72ccc4 +size 199058658 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..338ccc9e7f5af50b868c166cefd5164727f62ba2 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0303603cf82447d04df9ada8753ca0b1f4ae28304ea973812c961ed45736d5ff +size 199058722 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d3c536e3343931efdd015de623cc990cda8520b6 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b96a4dedd3a380e1287df19ade12445d532c635c2752e35b12b42a71dcec13a9 +size 199058722 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dade33ec9d573db8deb0f35f670343d2bd8b58ca --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd29350e36d382f4a3d4ce65ac7babc84a9739d8bcc29d0497a3bd88dcc38983 +size 199058658 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dd6a653c68635b033d760f7ba4121746cc6747fa --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d009f2a2d9a8490ae059e723f121e60b95a954b4a12ffafc5af4d2aca598dcfb +size 199058658 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..01b2042b2b516270e9385ece2fa6993a412fe05a --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:161e4755b0e27fa89f1505559072812fc356a84839461b7c3325953435c1e212 +size 199058786 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..565f929b6072391dc20698d180038b5ff308e8be --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58483cb4416d11188e09138692d0228aa83f90d2eb0ebdbb1b3a4e1382240e42 +size 199058786 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..01c92f4fc6fbc23da5cf90e16454335ed848df6b --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d19c3fc9b45d98371ebb1c7e554e2a94059bb7a6935541d439c9267ad12e86b +size 199058658 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b51eeb92a35bb0630777a18bd54779f06e04387c --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b32ee55b2c6d505e34e1e812a033727d2e7d9c6df438be1904039ceab0cc80dd +size 199058658 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9b848ed336d68af57b749e37be9f721b84181f39 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:723a4001706f99bd4caa92d0c75019a1ed0c4f5aba83e47d8c2c0d9aa6fa67b4 +size 199058978 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..473580709fbef75b66d9457326fa07a19bbaf046 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e870ea2a80670c046b92a793041fec0536973ffced12e7367162834d33d614e +size 199058978 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ac2e11a69a7c86d63ccacdc175085c91c8c44822 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f4092754ad686655332457a9cc770c185d16b9980453bef2a8c4d4e56c86461 +size 199058658 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3103f8dfc229556903f38179b02b110c19071805 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8021bff24902a10c231e78411ed6277f587b61a6e3314cba7fbf86bdbf37a6e2 +size 199058658 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0f1b0c5fd2cb56ea5d18e188f47f0dd8caf74cba --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7cef22b5df7dda966fc0f706f5ebae46cbbf5eb8e86e329aa97d854834d43978 +size 199058647 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..44a17993f89418293dacbf68fae50aa028531060 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e2d6f733bbed1dcbeb03e49e7817f8b9099df8680a2996a7a32f4307852540b +size 199058647 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..942281d2888c9f471e0c383aa2d1f01405b8dbfd --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e508c040bfa7840d57ee7c227bea1b35c048e67b7a57d587ca578e38c6092b5 +size 199058658 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dc7d0f334c7283ffdcc0e448232439cabaea053b --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b01c647378dbccfca4f25cf8d841bdcbe29320d18df41590a925fd488deb4fd4 +size 199058658 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f53f8e033d138dc22eec43020eddc24bffe26082 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:29d86ea67984c8c1de2892cc98fa1c4006072be5f7184f93d562af99eb050951 +size 199058722 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2950d3beefefef48162953da70340bcaef0d575c --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c54f4da1417f9244d4aa54a073dcfdeeda619767e15658f56f566568f7feaf58 +size 199058722 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..867af7642a4e04ca48ed8974638d6a7f2456a55c --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dcf07e32b659de785fab4e308ab8ef29e29f9bdf6deb7594448e282494748586 +size 199058658 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..33e9cc52f48d2159d1414cd1b51b18162df68e3e --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f19e4479b130ae733ad1f35987d086791aadd2fc9602109cd3886938e1e3e903 +size 199058658 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..09ed89db648bff2eb1c1e621f448805c94f32961 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:37ec6cb43760fb93704cebf45dc0c177ad5e33856ce5302d06fac23db4899d29 +size 199058786 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c72d99ed177757137703c598ab7c4c38d0d5d1dd --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:268cefc2e8599cd85e885ff2f542a3c203e4e96303cef05dbd0c3c0b5afd681c +size 199058786 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4279d1d0e06abb2d73eedbda02eb608aba13d59e --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9fa6b54e7efbc9ffaeaa7f221d1e6e5973d387368c7d8f22ef3ce573b9eda8d2 +size 199058722 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..abbd204400c7ddebb1cc15acd5460487dd7a0fae --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b5a25430dccf75d2217e7b2d5a4d4455b7770e03bb4a5085ed0f2afd857060c4 +size 199058722 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3b541d5c9ddac61cb2cca0b0ef13ca5d8d1e94e2 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51e2bc42424d5f70fe3cc6e9cddd5f4e725458acb26d63033220ecee1f05d981 +size 199058850 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9a70f9631d7f8fea73c86b4d62e1e55a1bfc99a8 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8cdd79b2374004f6936eb48f8ed7d37be5606b7b2265c592c1533a95b8f53290 +size 199058850 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..02f5d303cb6f42e5700c6b8818599fc34dfdf850 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:14197903cda9988c021e96c8663c77ce0a57d42cd3c1918a27328c61c7f3c0fb +size 199058722 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a38ee438eb29e5a3c7b6417113daee3f8ece63d1 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c791f6bdf46a55f17fac424c6714c46448ddddafa92f2d38c9d83100eeb3a093 +size 199058722 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f40e85aa68d660bdb0d55ea9bcc7669e96c7f8f9 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:72bd8efd757d5b6dda281990201ccccc1eaa14683b96804234f26af7e6f12d62 +size 199058722 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ca5fdf77e8619c2c95366c51631ea58798465f70 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f8d67af19bae79cad83d851a10a651a4537d4e7834955844cca90b06bbebdea +size 199058722 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3c045d2088a9f29572ee2e1bd8e9abf314396611 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:932f784e6b5ad4e2f2ec7f8e6f5f0964d3a32eda540bd00e3929127cf759e384 +size 199058594 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b77eacebfc9603bec973674a3846bd265a32e27d --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4fb801a59bcb58ccf8896560595a4d7ffce0cc33b4de1bef296fd0134ea4083 +size 199058594 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8dbbf3f4d5f6b26257a93a14c636e6ee6f13c137 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8170b6c5e96c16af7e9e4e607d2ed842711d7d22d89724b4574ccab4ade592f0 +size 199058786 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8bd3a61a77c6f478141b11d10ae607f356c4974f --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c9d88b9254536f33b3608b43b6d963f92f57cb6c0de562b733c5e9733071329 +size 199058786 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d57878795dcfd8e8e97ff929d9323211f41779b2 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ea89f9f88b9eee6d86638ca304fe9d2ee5f741fff69f035878571d2f58e984d +size 199058711 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bb17c1e86b9f9cd270a8fb281cbf41d8f74f96f2 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b0756e9c25d7fd194031814549f74279178f3357d7516124b9f3e6240cc9933b +size 199058711 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..11ad1871e8d1bfcf903fd72d4b7b93ff395500ac --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f2ef59770baafea74f844b93bc65b1156ee0fc4f802cf3fed2221e0b17ac22cc +size 199058722 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3f2873574075ceea7c4734730ec18307f68e2f1a --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39376ff95523bc7ac03c233e9d597a87c21cbc1f1b740454fcd3a54411cdf2aa +size 199058722 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9a106e492bd00d1233672fefb1e921c487fdb550 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2373897b95e00976411b8817befc14f992259a2924fd8b2e2c60e1ba1563f864 +size 199058722 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d2f9e542ee2ca7ceb7d4748459594db891836e21 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dcc71ce180096df755fec9830f18268fb6ff8626140063fd779779774c8b1b98 +size 199058722 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..087ccab042e4c7d6b617d12ecfc3368525900b81 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1552f080bc20e53be7445ed7d0f1f318eb182d0f9f29c12eebd0e71ae533869d +size 199058722 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3a27bccb70bb64c9bf32cc2dafb7ff56a8000164 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e0aa6872614dc43149f9037053839a6fa1ff4c8d74a14ef38888a92859a0b484 +size 199058722 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a9ab383b84c53aed3e690e8899d813990879888c --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df03aee58b86d118de6f1fca15034084bc4592ed512d809790e021a6af75f0d1 +size 199058722 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..57843864a5fca82030b71ad67f73bc0f1a548bba --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0990e99ff8e4651a8da0cd1bd81ae794f2d28fef1c1da7612dd6481da82c2fc +size 199058722 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bbc3bc9a821f0a0a9e72f98124ef216031613bf6 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:efe8fdab02b8d1d60684ed4fe3765fa798302d90ba2a9b85e3e0564192510c84 +size 199058722 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f19df4c1cbe8182912ab86928d33b472441e64be --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0152c4cd488cee586792b5b0012163839de2ff1b26a12d4f6d2d56921ff2ed11 +size 199058722 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..98f59f8fef2d4f023b2a88fb669a4d98b636806f --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d31b51efe6933ae8bfd291700ec422446b9fa020916bf9b6afd385a23d77ef7 +size 199058594 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..30504a1ea650b228c07627603f60bf8051f5a6df --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:63a763dfd129340f162f31b8135016e6916b860625543813c27e4b4e048d03f7 +size 199058594 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bca5350f7ba5c4cc6510011cec34bb57c6cb2eaf --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:80e9113f0e331ca33ca2ffd78175dfe8f067c405af507a93202bcd2cf3724d56 +size 199058722 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5c35f6a1b0839097fe5939393ef3e99a13a94479 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:57a9503798352adee8e28b847ec3fca1edcb60e474a36bff8718e6969aca554f +size 199058722 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e8743e347ed57e9dbf471ca7bb9e5ab104cbf5ce --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b7d40337fb6b0f5f67f591415060ddd906a2eb688e2e43f2489b38656f93b5d +size 199058786 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..79c2fe2d000f6a9b9f29091c23535aac68d61c7b --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06f736b9a9cc09ae102d1e822b2fb5541c2188b4dca1829a42a3e0113c1190b6 +size 199058786 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a974c3e3eb67ee279f87ef95bbcd4383193a819e --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:66cc03c193e14269b6132f543930747348306372ab4761f34be5a1584ecceea5 +size 199058850 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..627624aae050aa7dc74c8ddaa231654b6bdc792d --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6907ef815032311fcd65696ab6f8034c7c13d8ce9255fc6fe9e45550d3fd2aad +size 199058850 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0e596f9d8940ce52c77274f976ab5a7a6094758b --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df441f0e81f7c78534e5ec2e8b34edc7df6b4e8521ebfa1eb7bfd65cc0f5cfff +size 199058658 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..67503036d1ea29d1dd611bae5381a6126a4225f3 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5ddb987a391b7398393106b33e4b113e5a065d4752381a12aecf7a148516ae7 +size 199058658 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3f6b6671513859baafb3ab848a6b0a9e14321fa0 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:99c47f1678ec5d44d936e03cbffad452a99d186aacd2bef6561266ab73238091 +size 199058647 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..737a4ea3121993ca9ca067b3f307cb6ac0c8a537 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c479b38a3b29c56d287e5f29f45a5f6b12d09be1ea2b45018eadd9e9c35be0ab +size 199058647 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3b98f978e1863dc9d13830f2672a6309b3e1d06f --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:93512fca3776802e4649705f67eef1cee40ddcf30e76a5f22df500c69dbe7e51 +size 199058722 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3b5ec2ff36f9bc1201f625887c8c0ad8b3bec820 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f208e708edcf9db395a4f2cf12df652eadb76ada16fb370c93a17ca24e82e5d +size 199058722 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3790f43af6e35380b3f11f5ad5a12de9fdba6cfe --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d9a46471ac55f15073d6df5ed493a758dba0f49ef13817e5d679703166dcb2a +size 199058658 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0622dccf910ce4ca22544f40717d2a532eeb2701 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d0a7d509c9a9b6f474315c46149fae1a39a36946179878ce99398129ec23f8e +size 199058658 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c2a7b851b4c20fa5982d6cfc90afb7bdabef33a1 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:61b926f883579392cef9aab482e88df73fec1a9478ad59c4946aea90798525bf +size 199058658 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dce8489e4750279ac0c20588188d108c5d63c9d7 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d1bbea8d0dac0935d26d6d95fdbcae7b84d7a2feaa107ef9b0eef9a6ab40e7dc +size 199058658 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..582789163bab90efa8d518b2a97117de59ba0f42 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:afe6e576d7ff5f2cf2062382fc085bbf450281fa5613ef0019ec7288391b7357 +size 199058722 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cd8994124d45011ffb628107cf9d0d3cec05c26e --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a55897bb4301ae054ac42860a0833c4b6edcfaa7ae5450de7fccd0dc237c469 +size 199058722 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..51ca397e12c6b326a26d2369e8f0d3d2392e2442 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:57ea49b1a99f67431d171ede86f90db6a5e6cb6b90c5872591d450a4f02459a4 +size 199058850 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6dac0808c09a02a2ed208d3f25615862100a9332 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:384d3afca264dc24ebe93cdb083ddc6ad07ddc7a4eb6bb541abf1a55966b84de +size 199058850 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..43ad66f94d790356cc6dc651ec157c3d077be8fc --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:09fe5d50b32c6df434ca0382685676e4002b55fcca99de218c9f4d9f82826251 +size 199058722 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..94f1b9b0adc675f4140375089872fe727fe63c5a --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:648585a0beac083926f695462b2a3371c5d623ab58cdb98556942479d7742ccb +size 199058722 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..54f7bd68739489c93e5a2360c899c3783c225b41 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c7d5e3c81d8f64b8025460647e4f5521488455d5740c55d26a6bfb4079c3cef +size 199058658 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..45a5d60a27c6c16738ea018ac5ad4f5886714d83 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d061dc8f713e0ff2322908b4bb307f1f63b72d3d146d0d86394ea7d33380f89a +size 199058658 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8ebda0671d09d29bbe580126c496aaf9fd1841ea --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a06032f3d84ca2e71387fc21ad41f3119493ee0105494eaea9bd7889d62abf19 +size 199058722 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..67f9f097279059f1c779ce9ddda4775c58506c34 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9994d84befdc696ef8426149839492a8a368398d389b08252d5abc4d08376ea +size 199058722 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..de5ddbef76695948910eb3a8bf2b6d9224232f54 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b35484d9ce7ed7ceb4be729f37ba21459b818a1fa08a719523c05574d1cb1bb8 +size 199058658 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2fbba96f5aabf0f11021f00978fab572ae7fc22b --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9903c6181b430625373b6c8e31a7b1ff163bbd62ecb8364b055ef3aa8a28318d +size 199058658 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..447ff1f9b11dbe1e6a42ff23e169454e8e708d3e --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce017ca00df34a997046cecc99039b431996e446ff9e32f7419e13a739a4bdbb +size 199058658 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9593c774e7b672a447b44eb1546cdb5e3937292d --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7be87c4ac5c0d54a916e1582c31725eec7b6d7a10e53ab70a072b149139d659 +size 199058658 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ef40f868af751f79754fec0ac1b9139dcd033c97 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9ad58aa62853750d68c502f9005e1d6e2a2dbbffd32b160b624ebb49f59e295 +size 199058775 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1836f8e32cfd5762e7ef4c06668405db20e1fc84 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97072c807062c16f474d9a72f0003c31c11b3e2c7bfa4cfcf15eb7e1a083a3ab +size 199058775 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..474a73fff89db50f2497016f2d3f8e805ca81449 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:66fe7345a40301e523404d26e29e2a7a5f96b8624812f5e12647fd5b20a442b8 +size 199058722 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..41b8be0d9b9cf095e6fcfb3ad867344b3fb5d9fc --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f1d39a94611f202fd0a7c49846a76555ed839b90787c5691d8e187a47d17e9d +size 199058722 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9f381f46f7847837bb570f03441b47adf39a14dd --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6f23effcf41039ee8f89d3c72f715f2b3c526a1c3ea9796818bd65f34f49c68 +size 199058850 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..619e06dc9fbb1d3810795e60fb790354511a01fd --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7838992b463069520b8ca165b7e6295555ae77f405468a2710e08079d16c633f +size 199058850 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bf804d59af04108ae04013f5e471f89e966d5505 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d7f3a86d7358679349d9d47996abacb83dc54bf46c162b090e20900813fd1ea9 +size 199058722 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e60cef51ba2c6d73013be1739f5adaffe1a562e8 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:065cbd492c7e449d83db2fe2ca5d909fe9684c065a5192cabb1ea667837c34df +size 199058722 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..20c31d782411ed3817cdd8a1bb9e83082616e241 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2bb006f5eefb41115ecafeca413c5d748b3643550824155a6856771b970707e3 +size 199058722 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7af099b53ef2f3a82669f646c16907fe6739a45b --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c2001c3fc941123fa12d1692cfd0534a1c33fb706bc10c419a011c87dcc43b3 +size 199058722 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..61c52167e48df41453828780f85fbc15eee63502 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fced8ecd23db1617bf77683742ec08432d90bc2d9ad377d034928a252970c542 +size 199058722 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..462eb691a964869cecd7833f248513b49873c780 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f1c0c044a2848a5a4a901382003a92c9f379b7c05782ae833dcb16f22e38e80 +size 199058722 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1c37eca9f8b8a2197b3c30d5430bc6ae3929096d --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:222901d100ccee97bb17cf4bbeb552e46cf35c3cef646b6a16ee83d896f1485f +size 199058658 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f808310e77eb2695910f0e195c64721e42ed8591 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cbc232afec5036d3ed09e2c05ecb3036982724d2abca60595d28870647a22bae +size 199058658 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d6f257ea922174eb6788a3cf9088d8a1d9f9b190 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d96a04dd89b603cde83a7df9d48c734a8f4cd7437e9a9739619cda10130278be +size 199058722 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..acb0a0686d757ed67bca863440283ee04a0d1e7f --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:551360a578cd1ddde5edcfe1f413f6bb676a487e287fbf782b32f542aaf45dbc +size 199058722 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2a41b5daefcada2232f704a416c41ae9f34dd79e --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77a58cc084cd3c52ac17d87a09d7deab15db3eb8d0bb73a8af4625610f981239 +size 199058658 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8613efd955cd836df99423d313d0d71c79e67999 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f96dfe928bf7b1deb661ff35cc39cb666ab7b32c88e15efa5a15ccdf974f3880 +size 199058658 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..54821b283054e5eea3a4a2a74ade96ac6c2cf738 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:583dae554ef074fcdb62dc4af389fd3e211072cccb13245dcb217fc6a0f00535 +size 199058914 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..31bffa3cde3686b859e2db311b1d3af22ea9200d --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c31663a6afaafe8f07dcb85e8b1d09e385c0248677a25d8ef7336ed0fe8328cf +size 199058914 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a64c6cbc82a6503260756ec3a5c9b584784cd53e --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9247f80c8b473c57f9a4d8c077fccec2526294e4f2b01de596c93597a958e8dc +size 199058658 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..69c13f0d3893d70b5b07d5a3f806357bec8a6e9a --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:abc878dde1828429662047bc467d63cfc55893505c0e713d7d843329e4aac206 +size 199058658 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..76a2ebd2f1965b61130af5fd6956522e9cd6b4ba --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd22db455d25fa02b2a3dc33854621e6694baba0b02880ca282190b158a1937f +size 199058711 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..14436e4798aa035541dd252d91dfe4cb7fafeba8 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f1849b64cc4d2ff34d8ae1800647ff06edabd0ff29c9677232b92a39c8f770fc +size 199058711 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4e0f42a1afc0d10f539a9ef5914038432d26f746 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2502f671208b64ebb855d08e5aa5fa1ae5a3f96801038877fc6061383c1f2ea +size 199058722 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..44709c5258856138bb0103a6b0cada4e7ac159ca --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f24d3363a125e6f5f9663eba67e2d53b7d5d7ba5701ae9282e96860e2ad8d3f9 +size 199058722 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..229d3409c8f4c52fb3e69efd7a1ca5ed0fa72aae --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e732a764ae8ca42ab2291d968464504f875b741d8e49c161d64511124165d425 +size 199058722 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..10c6bf0904b41ac992bd328038d77ce1423edd45 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:397fa029ebbb4137e01c711cf03009bb1d568d397363d22bb1d9f384e9997bbf +size 199058722 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c5682ed83f6215035c16ed93347ada36521dba05 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2555ebca8af7ed613e9bc54677d80f708c13d1f9203ed1d59b043ce65558c99a +size 199058722 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8fa69544bce12bf91e61e3b132927527c23b0ba0 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dca9b81060e8f9eca7873f5c3e7ba0a42fee492f561650f5859b33a08dfe7d9c +size 199058722 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0fc93a32c04dae56287e18c3a2840298767b7a16 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f529ba5c5f6a533f5dbbd3f2656174866ef17b8d263aa275b9830ea7e1ba01f2 +size 199058658 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5eee1b2f4e6e3f0243fd264aac149923d8565c0c --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2866ee2c122291f95f5d402e5bed6b788f8b4605abc4b31383a136c642fe551a +size 199058658 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..699babfd128aea8e04072e3ebd84915a7b351bcc --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b571ef4e676fc5b182a4d4cdcc4b1035507f5a78b600566b964e6db456492d2 +size 199058658 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..421182a166794cade64e6addddbc86de717c8b7e --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31d57a5deae66326f1aa9ec76281d554a070297353fe694e4e1f3de4b0195d77 +size 199058658 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fc5109a9588272d6b0ccf768c56172b23422be1e --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ffe6c9d2449813900ab6c04baa9225310cdc2a41500d6ab6aadd7556f8ce2abc +size 199058850 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..562d7225b36d5fe143183df28f6e5499e71c82f1 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:689d1b197e9367232237edd4b0347e048efc7e9e0326671df1dbe1863cc2057e +size 199058850 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..776578c31e59f94864940a792839f7fbeac0f42d --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:118dc87bc5e23f184d2afe147747ebb8e22949af4eb85dd96154826f013e9322 +size 199058722 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..822d215ea9e413b156925ff9c52a9bd035ecac25 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10c6cdd22081934c34c9e42285478d9d85e038d2c0e68ed5331531bfdc25fe68 +size 199058722 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7b96990d7960cc917f33afaf9d6514371ce93d10 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20428b8867e9e989bb86724ea97a561b95769c54726159a49e6efc5c3ce81d95 +size 199058786 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9cc5d5d9f8fb4d5de45d04efa6ab1904a66002f6 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c398a466bfa3ca3ea713ec021c0435bac3b26c3607f96c17289410f8dc04caa +size 199058786 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e41822e01f82f96820aa4eed315a085594905c51 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:865140d6c1f04b4bbc134f3840f5a4b7652a674ab20cb6b7e1b19ce35b4e633d +size 199058658 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..00138127d598abb3954dc25d881fe677b88639e8 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aca2b894e1e2dfb28b943bd1e7c697e17fd5e5691fe8c66eb6c41ea8c1035f0e +size 199058658 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b48091c65addb2550f6cca67ad0c3a2cbc2b3c76 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9cb8f4566591b5d60bb86d3aa67a054bf8417733eed5d97df16d52c96265d46c +size 199058722 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4f7167bc0c65eb5fa449965e66851b99510693da --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2080365abf787fa2e83129f4fad506ce133716c9e66ec5584f0121668b16aea0 +size 199058722 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8af4459c3ba1828885549e81ca6dd473fdf150ae --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf5000f6bc0d9c054a4df490dbb9c2b3240b64f144daaff739273fa246736845 +size 199058647 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a5a60829d22f67509c5c451413e0d97049e31672 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c54905592992fed9e88811139ddb74c01099f7297d69ade765995e4e344c5be9 +size 199058647 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..be44c7e3402dfef817e162691720d7dd137405e8 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7ea95c9066d003c409f8896bcf3caf65a6f848ce8f2b825ea65fe2192517c7a +size 199058658 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cb698c733d85fd0c8a3322f1db351d9c96432ffd --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0fe76be357d7309412a3563cc31b3f3d5fa363cc8d7d76f5ab806dbb1bcf2684 +size 199058658 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ce81948bc2351e159a7ba28ed9e0eacec1f92986 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a187dc0c652fab27c35446edec93d245c00067ee5784ff41e0189c9bf645a52 +size 199058722 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7be269d49cc3940c0ba16dfedf66bbeac34d4ad6 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dffd034c579eba52e07a2de776d51cc28f409461c79756d4e4bd69edfa8124a4 +size 199058722 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bdb976fe68973938d8d2282c4a18c9d6e5bd5e7c --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4fddcfa0a740da37c114ad01667e843f9855d1975a2158b27744a14627d25b2b +size 199058786 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e43d5a9281b9d7615ed4320dd29c2338b1e9b22a --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2dca6d8a30c2c97b2d5ffc4fe74cdb0432e247191017b60e82e50cf61fe4eb38 +size 199058786 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b76a96910a2dae6634f6c6425f21dde8066831c2 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35e71a1c47d0170f5853682374248d1c2429bfbb11e9d676a50217f6f1d6793f +size 199058722 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..11571b6f3621b32ded2c6932b6d6fe353edb161d --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9f3aed018513fcb1a213e628ce2d9c7b5a007e6bde8d0bca213eab5fdf1f512 +size 199058722 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..70f8da56acac27f5af5702bd458e2992d712b4aa --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef9d637750acb2a8fe241b83f89a84900e02b7a92c7392dcf1f3b8e8f2587fcd +size 199058786 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..806f28cc0bffd5e6ec9fb0b21cbf3fd877d1c6d4 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:28974ec5b50cc41354443783122c4e960099c53984d43b764d2bac310c58b3bb +size 199058786 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..288bae07b4be3472282bb4306dbe8636e3551bcb --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:59318c724f9c9d408c981b2bfdfaef8df4947068d483335afc3902e804188d99 +size 199058658 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..43ba66ed145c64983b3821b862620fff6dbed78c --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:83e9ef3600c9c5646ca852ca692b317a8431518ece7512b1536611e0afa6f3c6 +size 199058658 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c586fa4dc9602b3b8469e77c0c2f9c27aca465ee --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:146dc7712dbfbf3ba6483f910db05f0ba4333143a7305ccad5188242b7baabae +size 199058786 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..eed709885b85e81e7bf2f5b9f99d4fb228a759fa --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c97786f810d2f7414f23a1d51374cae909eddb0b4d36772128706f8c2c1bef5 +size 199058786 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8e16cdf01f3194e83eef41089476f24d5d580630 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ea6e9013b60a50d9396e53a67ad401949ef98344edf051f445387c098af551f +size 199058658 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2dc63a551d4463a05946e5165a94f3f911203e3f --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd439f3cd5e3e65197dcc2e307d336aa9feabd6717c8d0a375ac146f1b7b868c +size 199058658 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..87c91e211f3b89f698a04e66955ec7442f8c30d4 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd93a9caa9b9b49bffa26dfbcead378c0e7b6fa8d3462a8b16c9480d535249e3 +size 199058786 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1ddcdc0ed8c1d92a387cad4295fb40793b3a7cf6 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:164bf7c49201bca2a9837739b687d66a2cf56cc24d6adef4b1842da25554965e +size 199058786 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..855d74448bfa94ffdcedc6f435f806c3ecc5f767 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:101d2c746344286ec36ade8346e4b351d1cacadb56150616257c3ee41031d544 +size 199058786 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c032aebfb0f31bda8377cc04dfbac9c515578b7b --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:47eb9443f77e84c77beb8913c3dc4471eeb72fc9407f96d293e82744e11caf84 +size 199058786 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..89e6d60dbe19f3c1acc067eaa02f9bd7419cdeb5 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:00615beaadcb48ef550f617082625cb91f72ea5c15aebfec9f7232ba96337e94 +size 199058647 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..65b0ea6f9ac0837e1651a63bb0be66fd0617123f --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:359b46078cb4b6b8ee5fb776618cc3c5c6556a2b747dc4df5d34146cb57a292b +size 199058647 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5e17b914524403d3feb6b5b5f429b59765def989 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:214263cdf59c62022c6e4879d2e3adf07a02717b169fa5b2d900e5b4742fd4f0 +size 199058722 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..121a20d03be36c2d97fe51844e39c339c2b68199 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d1f89f69f85227c99e994e4f00438a55e076127f528b0e423e94c70bfff4acd4 +size 199058722 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5bb2b1e495c07d6dd474607ad691fcafd8fc8281 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa65a57b0c6115115bae9039b065cb14cfe20d1c80f8d7685ed51afe099e0680 +size 199058722 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dd32a22e059dcd08a0eab5d31b1564ec36278b7b --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da8f427db420d6717a8a813ff89506686f79533b66287b8a4d0ba3e05ea44ad5 +size 199058722 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0042ee35ffeef86b7647fdf02b3fb28922692b2f --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d279ae4cc28eaef4c86a8031acc3b224e8f20713e815ecb6d55e15bc1d30d839 +size 199058658 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b40df39fa2c6c2e2bf59a755de54413bc94ebd7e --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e0dced6b8c53383b2b8496524fca0b343c5eb814cbaaabd0e3c7d62bcacf999 +size 199058658 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..41039e25cb5a06e18bfe70b16627b6ec93b9a97b --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:04c6f3f570e174768051b4bbc902075415fe3ba6ad14b3f1980a2bfc0a08eb2a +size 199058786 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3a290e705cbf8baa286ceacb34f12f1af966169e --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:332e603db2ff69f7e312e288e018971db5170d0f1dfcdeefb8edbb8261e33d26 +size 199058786 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c2bba35e5d42b48662ad4b1fa7c922caa7a1f2ad --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:edc0ba0dff349e544a957d88cf8e4297b3e3a77472835fde4bbd7b798c13da2c +size 199058658 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d02d666f9621218bc7b67de5a371ffe942d4a521 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:665477e1bb9526f300a509943a58366c7684bf0175b2772a565a837b05c61f38 +size 199058658 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4ee8d11135965ca48a455806332a7d0bbae11909 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3075d5e50a1a185e71c942d92464f7f6fb6be30cd4a0849362056cf437457a49 +size 199058786 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ade3d371e5b7c8e7fe5662b2a166bfc150549581 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76126aac9ade646dec60fb2f1e73144845a3efdf599d22754e65359dcb87e26d +size 199058786 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..034355e1cd8b7e60e6d1dd00fe1e86834a013855 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d57839b53a8804903c68afe2198ce31e37601638e9fc90987bc61b58456e7f8 +size 199058786 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a8243ac0fd8876439d571f1fff1ea671f950d2cc --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:115897afd9da0a1543e49c9f97e69513f9777f4946cd3bad0a41bc01122f3f3b +size 199058786 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..597a457a15041c7efbef047f4ea3c38c061bd607 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eda1bfc1a9ce9d0a316db3e1ca96bff5f9ed7ccd8d06a6e0e05b71f3a352f20d +size 199058722 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..60119bba975e29563fc2411ab17e93f4c833605c --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:53066514ea9673113d67f5f1f649b0439f32791996167bf71570f892b1f9e196 +size 199058722 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ad2fdd81521eb54a7f8282d85308731cebacdd07 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f6425253d76f8b403614212c312ed5c3eee30b85eb24f7cdfedb540f6943201 +size 199058658 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1b14d79f8faa4395fd0525970a65a1a551c61151 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:320c2302f992e8c1a3067850ef593e5ff655640644f4820c5391e844612ede9a +size 199058658 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..71f30924655d171ee4a80535c42421f1daf791da --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb699437408c7da1aba17831b27cad8647a75e64f7c6aa246b1112decdf9a5ae +size 199058658 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ad84fecb8dd873d155284fab1a44b30063bc3f6e --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d8b9613bbeab6d571101dcbbc4b54dcfa9237bdf17bfead43a1c49a797bd232 +size 199058658 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ab9d42b4d5c9a41c51c05c9c7b1be57df1b6078f --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:75dd69fb6d6af391c3f409f6c4989f14234b2337aa5bee59399750393977b395 +size 199058647 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fc9d1b51691080bb6efbce72263767692dc9fcc1 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e11591ef3ba25476fd7faeefb5d61b094a09c93b599d1c22af72d15de8ae83d +size 199058647 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..621c5833bb2f6b497da660dcbb603801375d09f4 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bae829e7149dda7f53ccdf5d1d8c297ea4c2cae9180de0412e4400799b33ad86 +size 199058850 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7c74e859495aa47880a224360ee2e3601f0d1e64 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:411ee7e3e25b06e03f5ef84812ec9cd5c53d677e9609074a1e75971fd5e25d14 +size 199058850 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1b85f1449c6168448b2457e79fd1ad657ce4ddd9 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6fb3be227154a3ef6082e8ae73c6c3188f2d53fc1c537630294091bd769a4522 +size 199058722 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..15283752c3fea5b897e0b762131a05a84eaf6fd1 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:945760850f4342162dff49a7f7a5b96099524a2f4a42caacdd26c46446fb410a +size 199058722 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..748de7208a07260cbd2b769f205d358dd7c3ddbc --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7331293e8d89d56270eae0ef61c0858cc1c6ec21501c6bfac780e8d91479a6e7 +size 199058658 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6cac67a3c750dfc619f00772f6f9e30d02017a69 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77313381d47a355e4143f9a2f2ffee2d01881b185cd4772dcea5e1f9a00055a1 +size 199058658 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d00eef0a4f8d7d42dbda3b3295286f7d82b46871 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:99b43597ecc4caf8190bdda68d046a44156d768dc5635c3d46cf64e83cda1744 +size 199058786 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..21f1c4c1a95c5341aab0d802e90a3d1ccd1fcb4d --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f547b99735df72cc0e12bb925592d7abc2d405725b6b481fe6bc0d060cf1a6f +size 199058786 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1e0e4b45f413676e23215f058eb38b89549a4332 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a100acb78e3c147c7146d3f863819c13fc20cf79589eb029f1e240be0743e482 +size 199058722 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5c704ed976618bf02700a56529fd5530fbfbb195 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:801d68855089531dc3f74527cf3eb1e85e3f3fc0f50c4ad2f82e92e3e77d1f50 +size 199058722 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9a87cdfb074087556da2b4a8300f7ba06201671a --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:38239faef183326eb4bd5d292b1d4b990acfd32e5042d355734334a68e584c4b +size 199058722 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1d4aff375f5f95ad0635cd6e68470b785dcb3e38 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:89ae988a3da134735a50bd538a8fa59696d61600fecff4df9eb3e9f2c10efe50 +size 199058722 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..219ebfb86aa4e4849b21230c3b6c8d3030717aee --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1af087ceb8ccdd3a3154aa9acdf256cf7ffc419c850ac4abfb3e1559e330cee +size 199058722 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..93ef9cec7df045564b1e2569d8615cd0ef7b6372 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dfdb2bea221b52feb7b8513243ab5adb69f66810640205ee5e77ee6d595a8e89 +size 199058722 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c1b18e033830d8129b1128cb97cd1d2fc7b23896 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b1aa36d573dc9342f1cadf10c4ca6bcb8c78f95fae35cfe58d32d92b1f01e0d +size 199058786 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..34e353ad4621851b3a0876b7fed588bc33352848 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:72cd655913d73f0f5ddd521f69598d7c96688a641894a3b9764978b4baf67562 +size 199058786 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4e61399b83631a4f7d0b1f20eecb521854035b02 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:979d758749ae73886b681a1f8eafdba05af1c97f8f87fe7580deec562cb86adb +size 199058658 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4060a881d71fc42bd3ff8229e0cdff96b3313daa --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f2bd6f1b30770e04d054d186482abbb55993608cb6a71801033413a3130ac204 +size 199058658 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3a479922e20b4b9c5a45503540aaa2910966c7ac --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:283a08e95f495a4e568adb365f8d5bd33a9a0425d6bcb548eb2ae0ca9ea95656 +size 199058658 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a2b1ecc57e5d92d13a37e51fb56241b4ccd19538 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c81a0aa70db8d163e12a04876aaa6b92bca9f9cf4cd5f90d3694ecdfa64483d +size 199058658 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f027b17a697897e5057afe31611aa9edfe10fa26 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:37b28bb773b8b3251b9de3458b2df21e94d5b7a2c775039865a9730b36219491 +size 199058839 diff --git a/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..80dafa5ee0c8a91460c1423c503b2f32936fad6c --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b3f7bdf5f4bf3bbb367486cf3e5b948b3ab98d8902b7e3a4fe45cae2a18462c8 +size 199058839 diff --git a/4b284b28bc4seed1/global_step80108/layer_01-model_00-model_states.pt b/4b284b28bc4seed1/global_step80108/layer_01-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..585f9d8a8343854a20c3b86046cfae75e6edb3d3 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/layer_01-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e017ec6cafe6c33dd527f89b78848fc1d677cf05d7f6a1ab6450a162787eb4cc +size 167511299 diff --git a/4b284b28bc4seed1/global_step80108/layer_01-model_01-model_states.pt b/4b284b28bc4seed1/global_step80108/layer_01-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9afb71552e42052984d199d3dfbebe5b15d7a672 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/layer_01-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3272706afe21f2f962b2da321278aa4c461ab56dfb7a6b973e75e50823dba34d +size 167511299 diff --git a/4b284b28bc4seed1/global_step80108/layer_03-model_00-model_states.pt b/4b284b28bc4seed1/global_step80108/layer_03-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..24e08fe505891a1d7fa411cd1b5b553dac80a764 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/layer_03-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:880eb5da8abe3ee5f4ca4414e73d632a32f37b0e923acd977dc1207fafcffe5f +size 113308931 diff --git a/4b284b28bc4seed1/global_step80108/layer_03-model_01-model_states.pt b/4b284b28bc4seed1/global_step80108/layer_03-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b6396f298e2f587ed204b0fb88dfa47ebcbcd811 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/layer_03-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:765ed4a257c0904a59c9572bf241cf4a9858cbf5373b35efa11cef2de04bad45 +size 113308931 diff --git a/4b284b28bc4seed1/global_step80108/layer_04-model_00-model_states.pt b/4b284b28bc4seed1/global_step80108/layer_04-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9acd2188b60fcf949be4f9cd852d0e636f0f840a --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/layer_04-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7bedc6151712f8a937f200920b9f75403d8911f92df35ae92a0c1a892cb23317 +size 113308931 diff --git a/4b284b28bc4seed1/global_step80108/layer_04-model_01-model_states.pt b/4b284b28bc4seed1/global_step80108/layer_04-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2eca7d53072c3e165b63ca39f023eed21e147b9d --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/layer_04-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e733616b934a5e158dd89df21c49e4157cca45d070a8d0f4b3ceb2224ba8280 +size 113308931 diff --git a/4b284b28bc4seed1/global_step80108/layer_05-model_00-model_states.pt b/4b284b28bc4seed1/global_step80108/layer_05-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2eb93f0a614f6aac304948a8493e4aabdfad8eef --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/layer_05-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:abaf882ac4a534ba92e84df9974e59e241e15c9a61d99074a4391c9b4427344e +size 113308931 diff --git a/4b284b28bc4seed1/global_step80108/layer_05-model_01-model_states.pt b/4b284b28bc4seed1/global_step80108/layer_05-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..041dd54a0f250accf4925900cc619c4ba231e808 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/layer_05-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b5349317330a1f8aad1b78c599b6085b026a6ac390bac94cde1cdbae5c8dc570 +size 113308931 diff --git a/4b284b28bc4seed1/global_step80108/layer_06-model_00-model_states.pt b/4b284b28bc4seed1/global_step80108/layer_06-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..95f83fc657e0135a3dad693cc7c70bbd22ee2570 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/layer_06-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6af08c1355b986cbeea5141c726cfae5387e531f9d0eb724a5702292c5823139 +size 113308931 diff --git a/4b284b28bc4seed1/global_step80108/layer_06-model_01-model_states.pt b/4b284b28bc4seed1/global_step80108/layer_06-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..834c1246b925465f1e8ebfc9da484551a19f40af --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/layer_06-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6590cfbbe6e759a2d7d4eba5ef7574d53076f4a6d18e1f9749e643bb972964e +size 113308931 diff --git a/4b284b28bc4seed1/global_step80108/layer_07-model_00-model_states.pt b/4b284b28bc4seed1/global_step80108/layer_07-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..25c8b5378982e332e4eb7a443ec6037dc2f1c0d0 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/layer_07-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d1261fb90a00b60159d65a9a4c46f2f4d568d06d7ead84518a655d783345aaaf +size 113308931 diff --git a/4b284b28bc4seed1/global_step80108/layer_07-model_01-model_states.pt b/4b284b28bc4seed1/global_step80108/layer_07-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..892141dbaa8a3b2878f83a165f06fa9a0df10c6e --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/layer_07-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f11c57c8e3b3e511fc84bff9105980d004ed29997c76fda89e9d0a014c9431cc +size 113308931 diff --git a/4b284b28bc4seed1/global_step80108/layer_08-model_00-model_states.pt b/4b284b28bc4seed1/global_step80108/layer_08-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fa5728d71d7803d36cfe20a9d2fdbe32f2e19518 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/layer_08-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1429a6c60d1927c9919affe7c7f3404653afc105a3c92505bd85fdb6a0cb80e +size 113308931 diff --git a/4b284b28bc4seed1/global_step80108/layer_08-model_01-model_states.pt b/4b284b28bc4seed1/global_step80108/layer_08-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cbc904a534c14b293151c7b5c6cd94463078cea1 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/layer_08-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74e50569a8a891d1162f245899c9684164305dc7e63e53dcf15f75662cc7eb40 +size 113308931 diff --git a/4b284b28bc4seed1/global_step80108/layer_09-model_00-model_states.pt b/4b284b28bc4seed1/global_step80108/layer_09-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..764fad4d6537f6bf5e2988a5c2bf5ed145b874ad --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/layer_09-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:072b3c446a431b30f70d343e3af622f8b97052b017980b29d6c9aaad72d7b292 +size 113308931 diff --git a/4b284b28bc4seed1/global_step80108/layer_09-model_01-model_states.pt b/4b284b28bc4seed1/global_step80108/layer_09-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bf73cf3e169fd0b6c0d72f31db56a35c84345ff9 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/layer_09-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d6e7b733e9e3e8b52a72be57a469a2fafcdb8c78ca6aa118f11e0e834726e38 +size 113308931 diff --git a/4b284b28bc4seed1/global_step80108/layer_10-model_00-model_states.pt b/4b284b28bc4seed1/global_step80108/layer_10-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..139d4a51cb3057b62461706eb455d6f7e06c1fb2 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/layer_10-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:96543a544b7d3724468b85c360b50a75a90a8ef5b251a70b9c5961c59215c253 +size 113308931 diff --git a/4b284b28bc4seed1/global_step80108/layer_10-model_01-model_states.pt b/4b284b28bc4seed1/global_step80108/layer_10-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c302e86a030363e4a464cc1bcec724e89751feb7 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/layer_10-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de3bbc30a04d9b559832cf71752a53d467ec44ad8f922c75eea0df536c28c73d +size 113308931 diff --git a/4b284b28bc4seed1/global_step80108/layer_11-model_00-model_states.pt b/4b284b28bc4seed1/global_step80108/layer_11-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..259159043ab2a904b4b3b3c5e2dfa1092aa0843e --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/layer_11-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe84b970f2317c32c774d901891ded871a4896e211e3224351e8c7efc62c0dbf +size 113308931 diff --git a/4b284b28bc4seed1/global_step80108/layer_11-model_01-model_states.pt b/4b284b28bc4seed1/global_step80108/layer_11-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..66a9f34e3634e5968e24c762e02b134af8a6d9b8 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/layer_11-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:afe1c86b95f96f8d2b325051279e436ea7327bcd861b612045c20aaf98f46b53 +size 113308931 diff --git a/4b284b28bc4seed1/global_step80108/layer_12-model_00-model_states.pt b/4b284b28bc4seed1/global_step80108/layer_12-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..58e87a4cd4598624b1ff1e8c1563a233a49ea58a --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/layer_12-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a82fd54f8a9dc104824f07501c20c6942ff3cda3f0e5b3db7de072b160615084 +size 113308931 diff --git a/4b284b28bc4seed1/global_step80108/layer_12-model_01-model_states.pt b/4b284b28bc4seed1/global_step80108/layer_12-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9405bf85f89c59b4cabfa3838633ef0a2a9850b7 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/layer_12-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51cfd3835bfb24173e0364f8e035a760719f00ad3e06aa088d98cee6b4be8c71 +size 113308931 diff --git a/4b284b28bc4seed1/global_step80108/layer_13-model_00-model_states.pt b/4b284b28bc4seed1/global_step80108/layer_13-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ccb9f3ddafaaa575b0835b4bb04dd31e81fc5c99 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/layer_13-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d19cbf275a03a79adcc925c3ff12f966d13417a5126bb0754f926c35c869241 +size 113308931 diff --git a/4b284b28bc4seed1/global_step80108/layer_13-model_01-model_states.pt b/4b284b28bc4seed1/global_step80108/layer_13-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..426fab26f8c9ab0a1251dd8b82c7fb3f55594df7 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/layer_13-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a6769793669a65b31847ede99804df20027552e8d87a4d2723b44b3f138eb035 +size 113308931 diff --git a/4b284b28bc4seed1/global_step80108/layer_14-model_00-model_states.pt b/4b284b28bc4seed1/global_step80108/layer_14-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8ea02a86fee6af37860aa2bbe2669f3752c4504c --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/layer_14-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d9e5bacf077e3695bce978a9704d78c55c29aed0131b171d6cff0fc18742a1c +size 113308931 diff --git a/4b284b28bc4seed1/global_step80108/layer_14-model_01-model_states.pt b/4b284b28bc4seed1/global_step80108/layer_14-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..84395f4ac30069384d3d271aa8009ed14092db84 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/layer_14-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:63e5971f8f139089b90e9de1600ba53a4032cd34ecde774b637725893cac2553 +size 113308931 diff --git a/4b284b28bc4seed1/global_step80108/layer_15-model_00-model_states.pt b/4b284b28bc4seed1/global_step80108/layer_15-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ca6ec901b5d6e448de7f4db3d2595a5d980de0e0 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/layer_15-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ff68ab5b41739762e6aada4d455bf4f966380d0e6b2d60fc49c60118e9f893f +size 113308931 diff --git a/4b284b28bc4seed1/global_step80108/layer_15-model_01-model_states.pt b/4b284b28bc4seed1/global_step80108/layer_15-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..03df26c4c22d3d6b6e390674b7a5d5a85f4b4bc1 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/layer_15-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2211afe9ba884ae558fae107477160d8ce1520c0a90aa273a8093370e09610bf +size 113308931 diff --git a/4b284b28bc4seed1/global_step80108/layer_16-model_00-model_states.pt b/4b284b28bc4seed1/global_step80108/layer_16-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..691e5d69f4085e410256ec5e2d8aa3a9197f3f2e --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/layer_16-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:932d3ffcb3c715ace72d1624df00948a5813f6095a4999951a884ccf472d0ff4 +size 113308931 diff --git a/4b284b28bc4seed1/global_step80108/layer_16-model_01-model_states.pt b/4b284b28bc4seed1/global_step80108/layer_16-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c07aad2ce3d980d4783db754ee43cfa65c0a06a2 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/layer_16-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1873c7717b7f58738a0b5d3806b92b6e5a72416c2567f60e7ed847e9645972c9 +size 113308931 diff --git a/4b284b28bc4seed1/global_step80108/layer_17-model_00-model_states.pt b/4b284b28bc4seed1/global_step80108/layer_17-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ccdb308a43eb47922c12bc6143610af00ce89b7e --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/layer_17-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:30287a324a62cf1551585fdcd48b6c2be6933496ea32e4527df8a5bef59533ee +size 113308931 diff --git a/4b284b28bc4seed1/global_step80108/layer_17-model_01-model_states.pt b/4b284b28bc4seed1/global_step80108/layer_17-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9584778f85be33bb2c07901e99e670861b972ff5 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/layer_17-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0aadfb3c490c7d4f2e86e6aae80521de658b8f8c9ceb845f2c1822874dfd56c3 +size 113308931 diff --git a/4b284b28bc4seed1/global_step80108/layer_18-model_00-model_states.pt b/4b284b28bc4seed1/global_step80108/layer_18-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e4edb603df002796cc91d246c5fcc2a6ba0c8792 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/layer_18-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f18611104f8030e1bb24a63dbd0f15286365fb74f9b4d9dade2ffb170a7e62a +size 113308931 diff --git a/4b284b28bc4seed1/global_step80108/layer_18-model_01-model_states.pt b/4b284b28bc4seed1/global_step80108/layer_18-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b4071d631568d0eed36e783f8d33c503fdb3565b --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/layer_18-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e82e2a699fc4e2b9d9fa7d7c3745d3550b6f4bef8c2ad1923b9cd9fb38fd5cf4 +size 113308931 diff --git a/4b284b28bc4seed1/global_step80108/layer_19-model_00-model_states.pt b/4b284b28bc4seed1/global_step80108/layer_19-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a484aa69338a032875d811f71c2e8c04d731bda3 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/layer_19-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90e4b43adb048e30e59d22f2c40c4a38214785f4c664b2a8c60f7e531caf5e82 +size 113308931 diff --git a/4b284b28bc4seed1/global_step80108/layer_19-model_01-model_states.pt b/4b284b28bc4seed1/global_step80108/layer_19-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..662f14eaefd92eaef411f89c39c0937ddee141f9 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/layer_19-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bcea8c5a2f043fc1db079d91c2bb80222ba5e504ec14f3df3a0b9bf1e6c85bf2 +size 113308931 diff --git a/4b284b28bc4seed1/global_step80108/layer_20-model_00-model_states.pt b/4b284b28bc4seed1/global_step80108/layer_20-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dfbdea1d90d68bb7f32ca1cb6033be219dfa01c2 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/layer_20-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:17329d094f277410fbfcdc69bd78e7c774324f425383a72bb08322b64915b3ac +size 113308931 diff --git a/4b284b28bc4seed1/global_step80108/layer_20-model_01-model_states.pt b/4b284b28bc4seed1/global_step80108/layer_20-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1863058f1daba23f6016f2dbb06ca9aa5324f8a7 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/layer_20-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac398d45a1903675b7c51952b29db9eb164da0c6dbbb42ba4d226ed68184f325 +size 113308931 diff --git a/4b284b28bc4seed1/global_step80108/layer_21-model_00-model_states.pt b/4b284b28bc4seed1/global_step80108/layer_21-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..597f5ae22a77026f4e8b148c7be3bf6963147a6b --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/layer_21-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ca4947f133d91d16a39e3e06885aa9cae308e163e5fa67d161ad13c7f4f1331 +size 113308931 diff --git a/4b284b28bc4seed1/global_step80108/layer_21-model_01-model_states.pt b/4b284b28bc4seed1/global_step80108/layer_21-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fd8a332f0a92557241a699170a799d99427af420 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/layer_21-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9372b40ec07f172f3c0778c8986812c8cac41b918569ebc6dbc061236280a98c +size 113308931 diff --git a/4b284b28bc4seed1/global_step80108/layer_22-model_00-model_states.pt b/4b284b28bc4seed1/global_step80108/layer_22-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..59ae8d036358cf98472058c779897571f3ce3b35 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/layer_22-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bdcbe09d4a1240ab367afcb5698d248f5afe549b94237f51ad3f8f2cf0667193 +size 113308931 diff --git a/4b284b28bc4seed1/global_step80108/layer_22-model_01-model_states.pt b/4b284b28bc4seed1/global_step80108/layer_22-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5cd4066ebd6439e3f4771a6cd7230a85671af263 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/layer_22-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9376ed055e6bcd63d089fbec262bfccd26923114aff17a905fabc9dd447636bc +size 113308931 diff --git a/4b284b28bc4seed1/global_step80108/layer_23-model_00-model_states.pt b/4b284b28bc4seed1/global_step80108/layer_23-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e3f78ae44514facfd3961e4a553743bdb5698abf --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/layer_23-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d26556a192fa68205cd6c688f4febcee14e57df62dd8c4ba550f9d4848e318b5 +size 113308931 diff --git a/4b284b28bc4seed1/global_step80108/layer_23-model_01-model_states.pt b/4b284b28bc4seed1/global_step80108/layer_23-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c1a64f0a7e1b70481bf076cc9d8a893071965166 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/layer_23-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:05f567abe91381ae210aa3126670bc4482816d13beb4e844cbf073e068570bd0 +size 113308931 diff --git a/4b284b28bc4seed1/global_step80108/layer_24-model_00-model_states.pt b/4b284b28bc4seed1/global_step80108/layer_24-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e53477dd1498fefc9625cff68abb733054bdf9a8 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/layer_24-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b53da575faef40366d6ace85e174440443914a85d88a4486e097ccc9d92a295f +size 113308931 diff --git a/4b284b28bc4seed1/global_step80108/layer_24-model_01-model_states.pt b/4b284b28bc4seed1/global_step80108/layer_24-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6eed9ba88aa1b2a9ff3c1fb8960d5cb569accb8d --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/layer_24-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c453ee84a4e34ef416ced07f20f4d47809238caa191bd76c7b2db5f1f7545f22 +size 113308931 diff --git a/4b284b28bc4seed1/global_step80108/layer_25-model_00-model_states.pt b/4b284b28bc4seed1/global_step80108/layer_25-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..12ec278a33c209c649ad76bd9a9677ec68daad9e --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/layer_25-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ff39a45c34f471e2737edd4467c90ed814907400f4ab778fc2ae60cd6805778 +size 113308931 diff --git a/4b284b28bc4seed1/global_step80108/layer_25-model_01-model_states.pt b/4b284b28bc4seed1/global_step80108/layer_25-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bb4edfdbaed181b4b06779b1d543bac6b42735a5 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/layer_25-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ab8916b3ad9ac8948f920282fe1056bb37afb389df590267062a61c447a2d37 +size 113308931 diff --git a/4b284b28bc4seed1/global_step80108/layer_26-model_00-model_states.pt b/4b284b28bc4seed1/global_step80108/layer_26-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..871cbbc8df51160e31e1ab69f1f9f7aea441160e --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/layer_26-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f643f31b21565cd052490392b52b22e7db5dc2156207fdb59cf2ceb1f11c6d75 +size 113308931 diff --git a/4b284b28bc4seed1/global_step80108/layer_26-model_01-model_states.pt b/4b284b28bc4seed1/global_step80108/layer_26-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a4ae0d642cf4313b196a5b84e981e185dbbb9a50 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/layer_26-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e17af463448cd25b9e963dde21056e91846ea154bbda32794fe6adc401c04f69 +size 113308931 diff --git a/4b284b28bc4seed1/global_step80108/layer_27-model_00-model_states.pt b/4b284b28bc4seed1/global_step80108/layer_27-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f0cf94e8b02103876903ed605c0806208c72a6f5 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/layer_27-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9a2cdda724617b998aa13dbddfc47338c8c0c138de74aa4e59cc3b8cabbfef3 +size 113308931 diff --git a/4b284b28bc4seed1/global_step80108/layer_27-model_01-model_states.pt b/4b284b28bc4seed1/global_step80108/layer_27-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9102ceefbaf83d5f785810bd62d17abd587567ff --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/layer_27-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:16db0e0bffa25a71b840e944739f37870af30591f4cfc439cd9ef6e444fbc5c1 +size 113308931 diff --git a/4b284b28bc4seed1/global_step80108/layer_28-model_00-model_states.pt b/4b284b28bc4seed1/global_step80108/layer_28-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..67c3a2feeb525337c3781dfce8c9ac36c87f820c --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/layer_28-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:edabad7320da2b6a78627eb65ad78764e98319db362451a12f5bcc551d7d41cd +size 113308931 diff --git a/4b284b28bc4seed1/global_step80108/layer_28-model_01-model_states.pt b/4b284b28bc4seed1/global_step80108/layer_28-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..868649c23ad4381c23274dbeba2169c6e3f3a920 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/layer_28-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6183f4f3a68286c5f5f51f5cd5bb53651858cb0c5572f62c92f4230a80359816 +size 113308931 diff --git a/4b284b28bc4seed1/global_step80108/layer_29-model_00-model_states.pt b/4b284b28bc4seed1/global_step80108/layer_29-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1384aa5143ac00facd3192508f02d1528f48f1f4 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/layer_29-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee32ab8e4b09f176d067dc72463fb378d123cdfa362596ff7c80a1c4184e8a75 +size 113308931 diff --git a/4b284b28bc4seed1/global_step80108/layer_29-model_01-model_states.pt b/4b284b28bc4seed1/global_step80108/layer_29-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..aeabef64287e64c7d59e8c0d5c1d87398ca40e66 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/layer_29-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1aaf02aa7a9dcb704523e90462c9be532b0ca30cb955b31cd9b155241d8f5e3a +size 113308931 diff --git a/4b284b28bc4seed1/global_step80108/layer_30-model_00-model_states.pt b/4b284b28bc4seed1/global_step80108/layer_30-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9de41318c67dd72a1d89d3d848c6c8fabbfe6a80 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/layer_30-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e32586ff47c54962dbdc07911f3aea5b633a63d414b740b67f04b4517272d68c +size 113308931 diff --git a/4b284b28bc4seed1/global_step80108/layer_30-model_01-model_states.pt b/4b284b28bc4seed1/global_step80108/layer_30-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..703fa74c4a0a4f867b61ad370788ac4910294a44 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/layer_30-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a014c0feca903b6675c5ef772648801e2f2fa03ae4edbea1576b0ad12659a3e4 +size 113308931 diff --git a/4b284b28bc4seed1/global_step80108/layer_31-model_00-model_states.pt b/4b284b28bc4seed1/global_step80108/layer_31-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..55a5ab0dccf0d94fd3405dab2c3fab2a63b0f8ee --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/layer_31-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e407473aeab3d86e45b67f2e27bb3231b4d6713dba17f0fb0da54b883f7694db +size 113308931 diff --git a/4b284b28bc4seed1/global_step80108/layer_31-model_01-model_states.pt b/4b284b28bc4seed1/global_step80108/layer_31-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6bc3c6e33b24e2e3227becbc31255ffebb13a258 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/layer_31-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb6206543f8d8329cff5c6d666f29dd66610c48ae939e0ce4afbc1d7716be307 +size 113308931 diff --git a/4b284b28bc4seed1/global_step80108/layer_32-model_00-model_states.pt b/4b284b28bc4seed1/global_step80108/layer_32-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9102d23b0c7844c34511fe7c91d298323c26946e --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/layer_32-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5eb4fe3f0f8680eec80d9336a07e51a06098fcdbda61ee671cc7dbffcbf52109 +size 113308931 diff --git a/4b284b28bc4seed1/global_step80108/layer_32-model_01-model_states.pt b/4b284b28bc4seed1/global_step80108/layer_32-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f66a5018d987e31084d54f707b019c45e1103a6c --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/layer_32-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:375d05b84f83dbf2684971bce2093bdb4619940a918f99f47aef45a6635ead6d +size 113308931 diff --git a/4b284b28bc4seed1/global_step80108/layer_33-model_00-model_states.pt b/4b284b28bc4seed1/global_step80108/layer_33-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5c4a3c2fa70af01afb751bcc4ae8422c6a16947b --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/layer_33-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d5325eea6085d60d0fefd8bdf138f6e347833c755ee17771bc53b5736e0e431 +size 113308931 diff --git a/4b284b28bc4seed1/global_step80108/layer_33-model_01-model_states.pt b/4b284b28bc4seed1/global_step80108/layer_33-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..657f78b76de106ddfe89dc798c04b249f19a8d39 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/layer_33-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:726f531b57873968db26d690471dce0cc2a76b666dc78fd4c5c0af0a426d90bc +size 113308931 diff --git a/4b284b28bc4seed1/global_step80108/layer_34-model_00-model_states.pt b/4b284b28bc4seed1/global_step80108/layer_34-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ed1f99957b06b21dbf8055729ca7b248779b2a58 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/layer_34-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:72e60e5de33eb89a5228b569535b4b76d224c9d58074cae0d22890053dee73d5 +size 113308931 diff --git a/4b284b28bc4seed1/global_step80108/layer_34-model_01-model_states.pt b/4b284b28bc4seed1/global_step80108/layer_34-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2de8e8a866b1aae710170d7ae4de9b04ae1114bd --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/layer_34-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0224f35f4f52909983bca07f7bdda4392bd92fd5b1de85b39e2e0c3dc0d3546c +size 113308931 diff --git a/4b284b28bc4seed1/global_step80108/layer_35-model_00-model_states.pt b/4b284b28bc4seed1/global_step80108/layer_35-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4bb5e31e85a0ec125e6deb4d5a213a198f141233 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/layer_35-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34ae06ace5113cf14383f9520c5bf86441f292327042e62914f30d3da2efc38e +size 113308931 diff --git a/4b284b28bc4seed1/global_step80108/layer_35-model_01-model_states.pt b/4b284b28bc4seed1/global_step80108/layer_35-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c7f66af012877f714c5d5d88504a07210f231e84 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/layer_35-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c32a825df107cbddd63501b81ac74bcda773fe81b02b917ef67dcccb68e96b7 +size 113308931 diff --git a/4b284b28bc4seed1/global_step80108/layer_36-model_00-model_states.pt b/4b284b28bc4seed1/global_step80108/layer_36-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5dc5d68b39dfe2f488a37e6631593c0a9c2c199e --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/layer_36-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7575f51a9bba13d1c95b6f2001c877dc6c43fb7049be539811f6dc9c7ce21163 +size 113308931 diff --git a/4b284b28bc4seed1/global_step80108/layer_36-model_01-model_states.pt b/4b284b28bc4seed1/global_step80108/layer_36-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..858a5e024e0e639cd1aa50ee822688fa2b95bd8b --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/layer_36-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b0edd7165bd1203f7cbe243de317bd94d60fc83fd23f8a11bc3f8496152d0e48 +size 113308931 diff --git a/4b284b28bc4seed1/global_step80108/layer_37-model_00-model_states.pt b/4b284b28bc4seed1/global_step80108/layer_37-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..934f852b59576424d19a63ce3a36322546f11a58 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/layer_37-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6945f02a60c89a5ed191f4cef622f9c80bc7a20bd365158701109be00bafadde +size 113308931 diff --git a/4b284b28bc4seed1/global_step80108/layer_37-model_01-model_states.pt b/4b284b28bc4seed1/global_step80108/layer_37-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5e84c22a9f6a856934ed76f6e57bb838b1e8cb47 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/layer_37-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee376eaddaf6e9382a380be04afecc2502c5182e34862cafdd2a9c665d891b49 +size 113308931 diff --git a/4b284b28bc4seed1/global_step80108/layer_38-model_00-model_states.pt b/4b284b28bc4seed1/global_step80108/layer_38-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b841aadfe84b44cdd8922c54f479b77e1784b135 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/layer_38-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:85823c5bb3216e2502cebcb37bc38d3a96a2cede1f597568e6d895801c8e439d +size 113308931 diff --git a/4b284b28bc4seed1/global_step80108/layer_38-model_01-model_states.pt b/4b284b28bc4seed1/global_step80108/layer_38-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6596a94c07503040fc9df4b9c1894a4016033e2f --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/layer_38-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46ad7aeeaca8cb4f5844e177578b7bd67f55c559276f738ae6b24e13f49e3410 +size 113308931 diff --git a/4b284b28bc4seed1/global_step80108/layer_40-model_00-model_states.pt b/4b284b28bc4seed1/global_step80108/layer_40-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6684d956cb2dc7927d86ba0ddbce2d74eb1447e3 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/layer_40-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:698fab32e5ac0a56ed2ec9a93c9cea626519032d40aa0039267d650e68fa7bb8 +size 13507 diff --git a/4b284b28bc4seed1/global_step80108/layer_40-model_01-model_states.pt b/4b284b28bc4seed1/global_step80108/layer_40-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..489d24773afde792fa68ac255222404dd80269a2 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/layer_40-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4dd8a63cfcf3eddf279398e286c6a8ba6ad668f1794629eaff81b4923e8125b4 +size 13507 diff --git a/4b284b28bc4seed1/global_step80108/mp_rank_00_model_states.pt b/4b284b28bc4seed1/global_step80108/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..06b3e0de3cca2f5faaaa7440dc3d57369183e6b3 --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:551262084618c907058bd1e5d5da3e147bb9081e6568577c91d990a8199946af +size 51507 diff --git a/4b284b28bc4seed1/global_step80108/mp_rank_01_model_states.pt b/4b284b28bc4seed1/global_step80108/mp_rank_01_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c3b70233c0082851c4fcef8712353372f5e4a1cb --- /dev/null +++ b/4b284b28bc4seed1/global_step80108/mp_rank_01_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b3f006937b7d724f76fee2799c66866b9dd3df9f4c1bb8d71e4c8ab976f9557 +size 51507 diff --git a/4b284b28bc4seed1/transformers/config.json b/4b284b28bc4seed1/transformers/config.json new file mode 100644 index 0000000000000000000000000000000000000000..df814c3a71ee49044410636b5eeb4f43611690ba --- /dev/null +++ b/4b284b28bc4seed1/transformers/config.json @@ -0,0 +1 @@ +{"vocab_size": 50432, "n_positions": 2048, "n_embd": 3072, "n_layer": 36, "n_head": 24, "n_inner": 12288, "activation_function": "gelu", "resid_pdrop": 0.1, "embd_pdrop": 0.1, "attn_pdrop": 0.1, "layer_norm_epsilon": 1e-05, "initializer_range": 0.02, "summary_type": "cls_index", "summary_use_proj": true, "summary_activation": null, "summary_first_dropout": 0.1, "summary_proj_to_labels": true, "scale_attn_weights": true, "use_cache": true, "scale_attn_by_inverse_layer_idx": false, "reorder_and_upcast_attn": false, "bos_token_id": 50256, "eos_token_id": 50256, "return_dict": true, "output_hidden_states": false, "output_attentions": false, "torchscript": false, "torch_dtype": null, "use_bfloat16": false, "tf_legacy_loss": false, "pruned_heads": {}, "tie_word_embeddings": true, "is_encoder_decoder": false, "is_decoder": false, "cross_attention_hidden_size": null, "add_cross_attention": false, "tie_encoder_decoder": false, "max_length": 20, "min_length": 0, "do_sample": false, "early_stopping": false, "num_beams": 1, "num_beam_groups": 1, "diversity_penalty": 0.0, "temperature": 1.0, "top_k": 50, "top_p": 1.0, "typical_p": 1.0, "repetition_penalty": 1.0, "length_penalty": 1.0, "no_repeat_ngram_size": 0, "encoder_no_repeat_ngram_size": 0, "bad_words_ids": null, "num_return_sequences": 1, "chunk_size_feed_forward": 0, "output_scores": false, "return_dict_in_generate": false, "forced_bos_token_id": null, "forced_eos_token_id": null, "remove_invalid_values": false, "exponential_decay_length_penalty": null, "suppress_tokens": null, "begin_suppress_tokens": null, "architectures": ["GPT2LMHeadModel"], "finetuning_task": null, "id2label": {"0": "LABEL_0", "1": "LABEL_1"}, "label2id": {"LABEL_0": 0, "LABEL_1": 1}, "tokenizer_class": null, "prefix": null, "pad_token_id": null, "sep_token_id": null, "decoder_start_token_id": null, "task_specific_params": null, "problem_type": null, "_name_or_path": "", "transformers_version": "4.25.0.dev0", "n_ctx": 1024, "gradient_checkpointing": false, "model_type": "gpt2"} \ No newline at end of file diff --git a/4b284b28bc4seed1/transformers/pytorch_model.bin b/4b284b28bc4seed1/transformers/pytorch_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..04823ff782354f09936e6f1db9a4eb76221cd333 --- /dev/null +++ b/4b284b28bc4seed1/transformers/pytorch_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:244762cf80deb1fe197fad31445bb6bb81be4d1de0dae123a44334a8bd9401da +size 8781203669 diff --git a/4b284b28bc4seed2/evaluation/generation/agg.4b284b28bc4seed2_GEM-web_nlg_en_PALM_prompt_0.json b/4b284b28bc4seed2/evaluation/generation/agg.4b284b28bc4seed2_GEM-web_nlg_en_PALM_prompt_0.json new file mode 100644 index 0000000000000000000000000000000000000000..4c55741ada8a09c69daadc10d8cad237d038d086 --- /dev/null +++ b/4b284b28bc4seed2/evaluation/generation/agg.4b284b28bc4seed2_GEM-web_nlg_en_PALM_prompt_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.33153388648094195, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.033005772984634425}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.07122303608863641, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0014591848220124259}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.30715399283349226, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004708720401522559}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.10892120808244464, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0019623579408930523}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.03301457183266829, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0008587185375204866}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.14854387481989287, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.003193281253509643}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.05087917177498001, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0012052999188796845}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.06820659069603296, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0013384312711305548}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.29787923352571516, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004614486799091354}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.1046596223130991, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0018274939775881785}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.06782306790846614, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0013642733366910549}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.29321572118705336, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004444992160741671}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.10379069725870145, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0018395610209924003}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b28bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b28bc4seed2/evaluation/generation/agg.4b284b28bc4seed2_GEM-web_nlg_en_PALM_prompt_1.json b/4b284b28bc4seed2/evaluation/generation/agg.4b284b28bc4seed2_GEM-web_nlg_en_PALM_prompt_1.json new file mode 100644 index 0000000000000000000000000000000000000000..67ce34837e13f4cade947e2a929d20fa56e4b017 --- /dev/null +++ b/4b284b28bc4seed2/evaluation/generation/agg.4b284b28bc4seed2_GEM-web_nlg_en_PALM_prompt_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.4390216732028977, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.02835432276037686}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.07291258825421418, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0012781399789461385}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.3797532045177941, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0054586371665182355}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.11512333876359498, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0017974110536525595}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.032868611308100475, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0007540345266181282}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.18168266286903503, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0037422324762068537}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.05213699889610434, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0010956033295937493}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.06806601322392085, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0011368722533979258}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.3553819785767932, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004968399489043776}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.10756044811692632, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.001603262453041204}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.06910714253449175, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0012031621148103201}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.3583493585506855, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.005014235277134646}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.10900979568571047, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0016850432132498889}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b28bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b28bc4seed2/evaluation/generation/agg.4b284b28bc4seed2_GEM-web_nlg_en_PALM_prompt_2.json b/4b284b28bc4seed2/evaluation/generation/agg.4b284b28bc4seed2_GEM-web_nlg_en_PALM_prompt_2.json new file mode 100644 index 0000000000000000000000000000000000000000..6e484094036a68486c3fdfa019906cfa29ab1340 --- /dev/null +++ b/4b284b28bc4seed2/evaluation/generation/agg.4b284b28bc4seed2_GEM-web_nlg_en_PALM_prompt_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.49541929016035524, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.025797242026580104}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.07266725444927156, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0011715118352015903}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.392286147400258, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.005249827988828273}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.11565855599729363, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0016715046204442972}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.03317260466126409, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.000696598360418341}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.1942947439780873, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0038612870273807783}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.05321206929632585, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.001036190867375003}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.06822626222269808, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0010788080778881023}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.3658441206667177, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004744182177069523}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.10849753112690429, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0015324126427550334}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.06911868824793722, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0011075456309651759}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.3723196892015273, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004901964131441716}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.10994078611093397, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0015743454993528729}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b28bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b28bc4seed2/evaluation/generation/agg.4b284b28bc4seed2_GEM-web_nlg_en_PALM_prompt_3.json b/4b284b28bc4seed2/evaluation/generation/agg.4b284b28bc4seed2_GEM-web_nlg_en_PALM_prompt_3.json new file mode 100644 index 0000000000000000000000000000000000000000..c07a77172d1cd03e5cf5eca13cb3f53cf916407b --- /dev/null +++ b/4b284b28bc4seed2/evaluation/generation/agg.4b284b28bc4seed2_GEM-web_nlg_en_PALM_prompt_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.5491960579253196, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.039648429482997495}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.07160364848852087, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0011783430176818728}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.3927842849413568, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.00522433426165448}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.11408517238759823, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0016665220312756322}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.03296327776337767, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0007230725204977183}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.19533584043693603, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0038707201775201655}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.052818017804867626, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0010623028200577843}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.06680503273038688, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0010837322892585253}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.36333847242647704, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004665099933938704}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.10630291986513662, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.001526814085910438}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.0681283239197468, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0011259165449605442}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.37225854905210065, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004887731193821206}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.10846020883153136, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0015890200535555973}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b28bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b28bc4seed2/evaluation/generation/agg.4b284b28bc4seed2_GEM-web_nlg_en_PALM_prompt_4.json b/4b284b28bc4seed2/evaluation/generation/agg.4b284b28bc4seed2_GEM-web_nlg_en_PALM_prompt_4.json new file mode 100644 index 0000000000000000000000000000000000000000..55c91cafba375606b77ab756042bcdd41ddeb00c --- /dev/null +++ b/4b284b28bc4seed2/evaluation/generation/agg.4b284b28bc4seed2_GEM-web_nlg_en_PALM_prompt_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.6089661489117988, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.04699623217901871}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.07213518977803757, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0011476197609056422}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.3992239446300711, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.005128894156765551}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.11514000344336653, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0016184571331864207}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.033158630338207526, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0006987407020504501}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.20032190789144683, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0038236156171148734}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.05332935191373514, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0010277690042407401}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.06683680650160255, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0010578019098300508}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.36520991395591773, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004493220490046675}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.10644937066363529, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0014847353193029158}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.06848539496662703, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.001092766850551142}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.3773679563441165, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004791768779964645}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.10920289975227614, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0015389130963739533}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b28bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b28bc4seed2/evaluation/generation/agg.4b284b28bc4seed2_GEM-web_nlg_en_PALM_prompt_5.json b/4b284b28bc4seed2/evaluation/generation/agg.4b284b28bc4seed2_GEM-web_nlg_en_PALM_prompt_5.json new file mode 100644 index 0000000000000000000000000000000000000000..786c6373f3f94e2df7069c5cf9df6626d78beb45 --- /dev/null +++ b/4b284b28bc4seed2/evaluation/generation/agg.4b284b28bc4seed2_GEM-web_nlg_en_PALM_prompt_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.6220539692203896, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.027241061650766073}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.0712682874127396, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0011261508589404943}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.40368204669190927, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.005176457083171882}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.11402382459454527, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0015862357548837988}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.0332020137953197, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0006861186130499352}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.20677377146703504, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0039525209229281264}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.05353546076223042, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0010071474225918618}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.06625798608998291, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0010442629568554243}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.3704875696637656, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004602314366146881}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.10577538472070054, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0014621636026219001}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.06783456627617492, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.001071886270802083}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.382465197548837, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004842551860701479}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.10844065292929861, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0015071351512198398}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b28bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b28bc4seed2/evaluation/generation/agg.4b284b28bc4seed2_GEM-wiki_lingua_en_tldr_en_0.json b/4b284b28bc4seed2/evaluation/generation/agg.4b284b28bc4seed2_GEM-wiki_lingua_en_tldr_en_0.json new file mode 100644 index 0000000000000000000000000000000000000000..f1ccafda607b91e0ab196b24e761039d27a67d76 --- /dev/null +++ b/4b284b28bc4seed2/evaluation/generation/agg.4b284b28bc4seed2_GEM-wiki_lingua_en_tldr_en_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.15182550911429873, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0018688893384549484}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.2589242894485067, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0026517724171458952}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.1779625720124565, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0018340890133845323}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.030739869666078615, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0007500707956482545}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.05422083314217582, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0013617275020705638}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.036223836197762725, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0008360695449580615}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.1163914580615846, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0012923332758585293}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.20559642048990517, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0021063218448770372}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.13797458766444107, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.00128706736916593}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.13832783036931234, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0016858294437463758}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.23756775868205818, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002450945116586128}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.1625132579484488, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0016598158056400846}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 1.5993765093997294, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.07506085369601702}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b28bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b28bc4seed2/evaluation/generation/agg.4b284b28bc4seed2_GEM-wiki_lingua_en_tldr_en_1.json b/4b284b28bc4seed2/evaluation/generation/agg.4b284b28bc4seed2_GEM-wiki_lingua_en_tldr_en_1.json new file mode 100644 index 0000000000000000000000000000000000000000..5cae0fa87e7d276c31f5c4f749e5a732996424a8 --- /dev/null +++ b/4b284b28bc4seed2/evaluation/generation/agg.4b284b28bc4seed2_GEM-wiki_lingua_en_tldr_en_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.18496096563065467, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.002050002215955609}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.3135599264124284, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0027341763298141864}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.21598714377615563, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0019024221215778328}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.043438836648193035, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0008698319584098167}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.07611495800976509, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0016061241867093036}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.05092387173534868, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0009502922893863336}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.1281515256406243, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.001291169012274189}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.2264556395402032, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0021416748555613593}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.15160062635446855, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.001239572009665517}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.17280855254177024, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0019099792075058242}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.2938664218975422, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0025815210408538384}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.2019926405301408, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0017749314312316205}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 2.5200403089231775, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.05693901717280776}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b28bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b28bc4seed2/evaluation/generation/agg.4b284b28bc4seed2_GEM-wiki_lingua_en_tldr_en_2.json b/4b284b28bc4seed2/evaluation/generation/agg.4b284b28bc4seed2_GEM-wiki_lingua_en_tldr_en_2.json new file mode 100644 index 0000000000000000000000000000000000000000..72865c1f9e6ecc717133176f34180fd8acb59fc1 --- /dev/null +++ b/4b284b28bc4seed2/evaluation/generation/agg.4b284b28bc4seed2_GEM-wiki_lingua_en_tldr_en_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.19241271397106163, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.002086863578689543}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.32031046447154404, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0027181669208385484}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.22231924312892618, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0018757379527855871}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.048019665884255235, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.000949724643152317}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.0836751095859514, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0017264035814644186}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.05579012272313604, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0010124966408794026}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.13376141964932425, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0013725108527129226}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.23124667730229143, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0021820014245572915}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.15627127285797618, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0012523054332758818}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.18081556496647747, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0019520981988559959}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.3025117234925768, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0026055764102078075}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.20921146077018363, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.001755514182451968}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 2.8246220069939314, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.05436929747000312}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b28bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b28bc4seed2/evaluation/generation/agg.4b284b28bc4seed2_GEM-wiki_lingua_en_tldr_en_3.json b/4b284b28bc4seed2/evaluation/generation/agg.4b284b28bc4seed2_GEM-wiki_lingua_en_tldr_en_3.json new file mode 100644 index 0000000000000000000000000000000000000000..a897216879304951491a14d35bd0a7337d8a81cb --- /dev/null +++ b/4b284b28bc4seed2/evaluation/generation/agg.4b284b28bc4seed2_GEM-wiki_lingua_en_tldr_en_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.16640193920440474, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.002472882187893366}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.2649663905434579, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0032993991901049875}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.1848100615479409, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0022579690258614704}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.04051313387433241, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.001042560540352432}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.06748612349747192, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0016580523507809426}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.04536872008122934, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.001002873578150144}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.11778833422399672, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.001764546075584022}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.19297885421052255, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002524627264850371}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.13129086818074612, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.001545448883255699}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.1560147423913123, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0023125754138923474}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.249482350470566, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0031348571322463346}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.17351085580896572, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002116003523751111}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 2.775126184527832, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.04964262533072551}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b28bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b28bc4seed2/evaluation/generation/agg.4b284b28bc4seed2_GEM-wiki_lingua_en_tldr_en_4.json b/4b284b28bc4seed2/evaluation/generation/agg.4b284b28bc4seed2_GEM-wiki_lingua_en_tldr_en_4.json new file mode 100644 index 0000000000000000000000000000000000000000..c79cbd0288f36472baa4f79448dcb2d97b7dffdf --- /dev/null +++ b/4b284b28bc4seed2/evaluation/generation/agg.4b284b28bc4seed2_GEM-wiki_lingua_en_tldr_en_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.05264325356647027, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0019548941831179097}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.08637392317712084, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0029446541600125875}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.05762199753523481, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0019234101466023426}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.012435473489888542, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0006697583811981027}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.022066243551567184, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.001176386791377328}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.013932175935494801, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.000677479417971868}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.038774748862737, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0014187651157647537}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.06558722529459496, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002298264781788869}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.042630350228712206, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0014055059931358702}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.049317168459700536, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0018317279159510054}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.08119886671766297, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002771971428999714}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.05397101577019339, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.001795986537373056}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 0.6328100673630783, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.039922860842299984}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b28bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b28bc4seed2/evaluation/generation/agg.4b284b28bc4seed2_GEM-wiki_lingua_en_tldr_en_5.json b/4b284b28bc4seed2/evaluation/generation/agg.4b284b28bc4seed2_GEM-wiki_lingua_en_tldr_en_5.json new file mode 100644 index 0000000000000000000000000000000000000000..ed6b71a8a3ebdcfacce3df996820f234bcc1d737 --- /dev/null +++ b/4b284b28bc4seed2/evaluation/generation/agg.4b284b28bc4seed2_GEM-wiki_lingua_en_tldr_en_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.008573781066321003, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0008654762638624486}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.013672256166431493, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0012985268683484443}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.009114245109778818, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0008561600546824989}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.001966748909838605, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.00025417327235094497}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.0033662241091160935, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0004534618115491094}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.0021689783329266383, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.00026415328416558304}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.006239534916325571, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0006307296825652261}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.010041041492697021, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0009608570474005339}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.006612705879560682, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0006186105809635613}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.007874956167229618, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0007946305678768076}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.01258508198697765, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0011929631283971707}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.008378974054458118, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0007859574648450136}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 1.8294461842495436e-06, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 2.8960441784514307e-06}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b28bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b28bc4seed2/evaluation/generation/agg.4b284b28bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_0.json b/4b284b28bc4seed2/evaluation/generation/agg.4b284b28bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_0.json new file mode 100644 index 0000000000000000000000000000000000000000..142ea875e7d9a2e81abf168f6828c790f6dd461f --- /dev/null +++ b/4b284b28bc4seed2/evaluation/generation/agg.4b284b28bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 1.4134342817933134, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.10321165497606506}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.10247313979693526, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0016595089176992329}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.08798141485351638, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0020421795807805876}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.07268079919042715, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0013299276492676378}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.00887479842846684, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0005272736841464594}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.014404059874404535, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0007753598252854332}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.00993468622248673, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0005343002508124515}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.10002794388883973, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0015746721314263722}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.08578186838136309, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.001963617682885378}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.07081998927780214, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0012624377157260348}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.09505113511885002, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0016104542116781076}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.07341402605300737, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0017014954492227232}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.06325547718223694, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.001146593422118666}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b28bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b28bc4seed2/evaluation/generation/agg.4b284b28bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_1.json b/4b284b28bc4seed2/evaluation/generation/agg.4b284b28bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_1.json new file mode 100644 index 0000000000000000000000000000000000000000..dd3c7f4be7ba1bea1283d504084bf05f32f42179 --- /dev/null +++ b/4b284b28bc4seed2/evaluation/generation/agg.4b284b28bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 11.161361331881567, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.12372614680699576}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.5102128961431266, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0032435467042979615}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.41996959404299955, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.003000739317309415}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.4325678229581062, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002292323583369995}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.2347486548964982, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0025124030520577855}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.18995161561629698, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002108346628324476}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.19587297305804474, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0019046996832194681}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.3718563664348661, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0028475505595708522}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.302335969435588, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002389554465547073}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.3125033610005072, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.001959745932298407}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.41834560442201607, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0030773847535100003}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.3428712422996488, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0027256967100605344}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.35360222601109786, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002221056794276662}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b28bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b28bc4seed2/evaluation/generation/agg.4b284b28bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_2.json b/4b284b28bc4seed2/evaluation/generation/agg.4b284b28bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_2.json new file mode 100644 index 0000000000000000000000000000000000000000..753e5779288304ba4ce32205c65090ab3f531473 --- /dev/null +++ b/4b284b28bc4seed2/evaluation/generation/agg.4b284b28bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 11.178478800336915, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.18720778468970048}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.4641458682797714, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.002971633166316723}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.45712689402679485, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0028529123911751396}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.43564156295510353, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002087610230342593}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.21534769962339712, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0023043178046714048}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.21108519516124935, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002144830729960772}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.20007291305638683, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0018220503474021836}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.3373737455708324, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.002541494576877095}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.3312050835060631, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0023578769935104662}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.3154129310627208, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0017997732274878523}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.38666807747150694, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.002816195982796137}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.3803128282949514, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002684776810203093}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.36253839271187577, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0020879729234347427}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b28bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b28bc4seed2/evaluation/generation/agg.4b284b28bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_3.json b/4b284b28bc4seed2/evaluation/generation/agg.4b284b28bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_3.json new file mode 100644 index 0000000000000000000000000000000000000000..4d139cd9a385674524fe2d08af0e9b1bb350a8d0 --- /dev/null +++ b/4b284b28bc4seed2/evaluation/generation/agg.4b284b28bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 11.078551573988406, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.1775440487553758}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.43295946805897406, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0024929063336741916}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.47117854558838085, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0027664367541802696}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.4326675462538715, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0019582645124443902}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.2009303237548315, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0019532985877392488}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.22075863091567335, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0021918759824511784}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.200583189798169, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0017572494683324837}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.31641399110077373, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.002147128833979884}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.3443145885276902, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002348509165132024}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.31563666321158207, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0017274457082887083}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.3650689748250584, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0024222254606659755}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.3971452452707439, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0026671950920676476}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.36464056912358683, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002012766885114503}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b28bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b28bc4seed2/evaluation/generation/agg.4b284b28bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_4.json b/4b284b28bc4seed2/evaluation/generation/agg.4b284b28bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_4.json new file mode 100644 index 0000000000000000000000000000000000000000..0370a79fcca062b839fcd9882987587c6173a8ab --- /dev/null +++ b/4b284b28bc4seed2/evaluation/generation/agg.4b284b28bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 11.26779671250681, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.20945092499394355}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.42504057259498224, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.002302694388890242}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.479467443521395, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002694693864079371}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.43468339695150743, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0019192301545953678}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.19787815742992643, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0018370754370625954}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.22626550198253664, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002204792167524998}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.202879451815592, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.001765189527045149}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.31019836982770554, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.001959650847184396}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.3507681740649588, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0023395609242667513}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.3172808489106893, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0017201307043284524}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.3582038693968529, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0022423131040152167}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.40461547051620306, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0026339178059616598}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.36655599606622596, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0019897208220121514}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b28bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b28bc4seed2/evaluation/generation/agg.4b284b28bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_5.json b/4b284b28bc4seed2/evaluation/generation/agg.4b284b28bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_5.json new file mode 100644 index 0000000000000000000000000000000000000000..37be29022e267ad35833910377efc9629f4c4c99 --- /dev/null +++ b/4b284b28bc4seed2/evaluation/generation/agg.4b284b28bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 11.056827999458564, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.18078644474517908}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.41637768269876485, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.002227557311413217}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.48001165743040636, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0026762804898328154}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.4309560903845341, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.001893293831351894}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.19341945111333012, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0017901333419283593}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.22629146190496788, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002191585425335327}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.20083246520570572, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0017445182528093705}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.303929949160996, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0018891083086755413}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.35261189373922003, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0023727357497467937}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.31519997823452967, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0017133598116412512}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.35227968062569365, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0021866137017689286}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.4064043196987044, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002605112678915691}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.3646984779801211, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.001960028955951922}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b28bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b28bc4seed2/evaluation/generation/agg.4b284b28bc4seed2_gem_xsum_article_DOC_summary_0.json b/4b284b28bc4seed2/evaluation/generation/agg.4b284b28bc4seed2_gem_xsum_article_DOC_summary_0.json new file mode 100644 index 0000000000000000000000000000000000000000..ef8923fe31f070a96c583d1bcc40cf5fafbbebc0 --- /dev/null +++ b/4b284b28bc4seed2/evaluation/generation/agg.4b284b28bc4seed2_gem_xsum_article_DOC_summary_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.16347573034711765, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.002235052767052065}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.361809595461701, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004450055018587551}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.21824095908596577, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0025874062237003148}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.04080119463614899, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0013586822504416986}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.09489684727762387, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0030304863214365187}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.055096743612893836, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0017015215521108862}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.12349304284569401, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0017244637096469517}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.27540408956152623, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0035538299823413846}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.1649602106468539, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0019703191216796398}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.12787359610941754, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0018576292031407871}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.2854470256837463, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.003942621790562841}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.1710468546463645, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0022098555753275687}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 2.295517441700607, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.09915357248852676}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b28bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b28bc4seed2/evaluation/generation/agg.4b284b28bc4seed2_gem_xsum_article_DOC_summary_1.json b/4b284b28bc4seed2/evaluation/generation/agg.4b284b28bc4seed2_gem_xsum_article_DOC_summary_1.json new file mode 100644 index 0000000000000000000000000000000000000000..4f6057ee6d13d3ece2830de4f10518e729f6cf43 --- /dev/null +++ b/4b284b28bc4seed2/evaluation/generation/agg.4b284b28bc4seed2_gem_xsum_article_DOC_summary_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.12498263517558904, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0018439932798174727}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.30997040065867815, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004377559967707829}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.1759444559759621, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0024983727013912576}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.023984343121594594, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0009703036853821361}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.061937587800487796, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0025773754792855217}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.03416151854233213, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0013809223175216116}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.09683506809823249, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0013556223253912536}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.24217304938796147, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.003372900627372106}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.13659440083004393, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0018529344115148084}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.099266332557722, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0014699947767357671}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.2484370722635638, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0036565129132140007}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.14008466520947307, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0020194523247221608}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 1.3192475830096537, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.07504584122763394}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b28bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b28bc4seed2/evaluation/generation/agg.4b284b28bc4seed2_gem_xsum_article_DOC_summary_2.json b/4b284b28bc4seed2/evaluation/generation/agg.4b284b28bc4seed2_gem_xsum_article_DOC_summary_2.json new file mode 100644 index 0000000000000000000000000000000000000000..97a5d7610a5dc5604704f3d3c7c60f9166903d4f --- /dev/null +++ b/4b284b28bc4seed2/evaluation/generation/agg.4b284b28bc4seed2_gem_xsum_article_DOC_summary_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.12308471402675025, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0017964024163926668}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.30420591170874123, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0042091034345315345}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.17317479594583315, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0024306874343318695}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.024998880277592218, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0009660509776349401}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.06368455444982171, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002497504245191044}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.03548103421040685, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0013648086670444103}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.09766064805279387, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0013763841420730348}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.24210898643660594, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.003269851529578185}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.13747942038634384, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0018617507575533767}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.09700451417856086, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0014713838347837971}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.2416228650888391, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.003570749791914669}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.13676635773915868, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002012262737653545}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 1.3941983933749893, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.07778092606300743}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b28bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b28bc4seed2/evaluation/generation/agg.4b284b28bc4seed2_gem_xsum_article_DOC_summary_3.json b/4b284b28bc4seed2/evaluation/generation/agg.4b284b28bc4seed2_gem_xsum_article_DOC_summary_3.json new file mode 100644 index 0000000000000000000000000000000000000000..2cab2eec91f3a96c07a3e619dd25da92307ebde2 --- /dev/null +++ b/4b284b28bc4seed2/evaluation/generation/agg.4b284b28bc4seed2_gem_xsum_article_DOC_summary_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.1238798362783257, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0020371925631676394}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.2938277668513655, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004445484366807697}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.17052015726603906, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0026006019517768233}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.025223685922742684, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0010126897278031643}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.06217111485022419, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0025204701650283143}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.03519128429327673, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0013864951253610754}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.09880564731360271, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0015869573723169535}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.2348719293167949, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0034616442328126336}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.1359902514132361, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.002000179300648128}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.09736356730337334, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0016253165748697476}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.23279761437533245, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0036609997549228836}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.13420532702105284, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0020736765057759775}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 1.447300262525524, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.0647434385662156}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b28bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b28bc4seed2/evaluation/generation/agg.4b284b28bc4seed2_gem_xsum_article_DOC_summary_4.json b/4b284b28bc4seed2/evaluation/generation/agg.4b284b28bc4seed2_gem_xsum_article_DOC_summary_4.json new file mode 100644 index 0000000000000000000000000000000000000000..96789d307aab2c398ec3a26857f47d211a06c0b4 --- /dev/null +++ b/4b284b28bc4seed2/evaluation/generation/agg.4b284b28bc4seed2_gem_xsum_article_DOC_summary_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.03916972701362441, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0025232037599719035}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.0705187151734879, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0041033703238095975}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.04587682793613896, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0026664431362576437}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.007496872523694719, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0009023223955939198}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.013768613253728622, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0013735135943198867}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.008749872613988179, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0008910869873582503}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.03154543945422246, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0020528668246378276}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.05618648837737757, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0032188263348742517}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.03641897598226805, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0020590368431718546}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.031542117455926555, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0021071412880804725}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.055916896434064445, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.003269542426299847}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.036286088799465356, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002099169574521433}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 0.6399540831907461, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.0665572258832638}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b28bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b28bc4seed2/evaluation/generation/agg.4b284b28bc4seed2_gem_xsum_article_DOC_summary_5.json b/4b284b28bc4seed2/evaluation/generation/agg.4b284b28bc4seed2_gem_xsum_article_DOC_summary_5.json new file mode 100644 index 0000000000000000000000000000000000000000..0ac03375281a19d937fbd82555481b6576244224 --- /dev/null +++ b/4b284b28bc4seed2/evaluation/generation/agg.4b284b28bc4seed2_gem_xsum_article_DOC_summary_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.0030262317078135763, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0008861957572341574}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.002682824319713878, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0008349754331976099}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.002797377262876916, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0008436395309397021}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.0005864695792553728, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0003600452195293311}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.0005925913708932577, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.00039524060846512425}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.0005852654722501501, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.00037583234587724155}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.0023057883289935395, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0006706823613650493}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.002115155017368573, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0006595785512806381}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.002169100825975142, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0006545600161608136}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.00240202126410433, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0007072328465422081}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.0021726632985610644, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0006770960348507971}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.002243893464585761, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0006801725997564016}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 4.294601973766167e-36, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 7.391409466573723e-32}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b28bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b28bc4seed2/evaluation/generation/examples.4b284b28bc4seed2_GEM-web_nlg_en_PALM_prompt_0.jsonl b/4b284b28bc4seed2/evaluation/generation/examples.4b284b28bc4seed2_GEM-web_nlg_en_PALM_prompt_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..3930cb393b2d4e8b735c1eb48903e41755d784dd --- /dev/null +++ b/4b284b28bc4seed2/evaluation/generation/examples.4b284b28bc4seed2_GEM-web_nlg_en_PALM_prompt_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b60dc8872129bd11976567b261df994430504eadbcc4f23f801ec405c9273fd +size 4134729 diff --git a/4b284b28bc4seed2/evaluation/generation/examples.4b284b28bc4seed2_GEM-web_nlg_en_PALM_prompt_1.jsonl b/4b284b28bc4seed2/evaluation/generation/examples.4b284b28bc4seed2_GEM-web_nlg_en_PALM_prompt_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..ce6735f4a1fbcd3f7ec970605afc5caf88b57f91 --- /dev/null +++ b/4b284b28bc4seed2/evaluation/generation/examples.4b284b28bc4seed2_GEM-web_nlg_en_PALM_prompt_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cefc80832eb0015804cdeb48778fe42e7ce2956488579bb555e8f2f98dcf3394 +size 5142294 diff --git a/4b284b28bc4seed2/evaluation/generation/examples.4b284b28bc4seed2_GEM-web_nlg_en_PALM_prompt_2.jsonl b/4b284b28bc4seed2/evaluation/generation/examples.4b284b28bc4seed2_GEM-web_nlg_en_PALM_prompt_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..0f1ecfb0bed71f36492d325c4fa8f7e330455951 --- /dev/null +++ b/4b284b28bc4seed2/evaluation/generation/examples.4b284b28bc4seed2_GEM-web_nlg_en_PALM_prompt_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a53cf75923ef019b9ec0eaba261898ec51caa581101b0c4ec64298b8306753d6 +size 6043415 diff --git a/4b284b28bc4seed2/evaluation/generation/examples.4b284b28bc4seed2_GEM-web_nlg_en_PALM_prompt_3.jsonl b/4b284b28bc4seed2/evaluation/generation/examples.4b284b28bc4seed2_GEM-web_nlg_en_PALM_prompt_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..3766568f70cb62612e2bdac4930a6be0c61f3bb8 --- /dev/null +++ b/4b284b28bc4seed2/evaluation/generation/examples.4b284b28bc4seed2_GEM-web_nlg_en_PALM_prompt_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:54368856c1854ac609c84ed31c593a84b3836f85b374e2c2dcf53cdd1d3a2a65 +size 6973084 diff --git a/4b284b28bc4seed2/evaluation/generation/examples.4b284b28bc4seed2_GEM-web_nlg_en_PALM_prompt_4.jsonl b/4b284b28bc4seed2/evaluation/generation/examples.4b284b28bc4seed2_GEM-web_nlg_en_PALM_prompt_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..532726a8aca4351caa8d0fba55936c5f593c5a8b --- /dev/null +++ b/4b284b28bc4seed2/evaluation/generation/examples.4b284b28bc4seed2_GEM-web_nlg_en_PALM_prompt_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31ff1580837c3481bccad0d7cec3ec42518afd54a274d00bd82dc23574bd6a87 +size 7876130 diff --git a/4b284b28bc4seed2/evaluation/generation/examples.4b284b28bc4seed2_GEM-web_nlg_en_PALM_prompt_5.jsonl b/4b284b28bc4seed2/evaluation/generation/examples.4b284b28bc4seed2_GEM-web_nlg_en_PALM_prompt_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..673ef0c3dffaaed4327ef0f637c4efdfc1da6742 --- /dev/null +++ b/4b284b28bc4seed2/evaluation/generation/examples.4b284b28bc4seed2_GEM-web_nlg_en_PALM_prompt_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a5dcb3894272fec97efc23aa9677923c9eff8b2c23869f64a574db17e19ea39 +size 8794518 diff --git a/4b284b28bc4seed2/evaluation/generation/examples.4b284b28bc4seed2_GEM-wiki_lingua_en_tldr_en_0.jsonl b/4b284b28bc4seed2/evaluation/generation/examples.4b284b28bc4seed2_GEM-wiki_lingua_en_tldr_en_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..3de6008d02d203d73bd905348aef33069e86f074 --- /dev/null +++ b/4b284b28bc4seed2/evaluation/generation/examples.4b284b28bc4seed2_GEM-wiki_lingua_en_tldr_en_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0bceff2da72d04d3606f674b71b76272ef21f432b4e9d43b5a6af071fea2f6d8 +size 7693993 diff --git a/4b284b28bc4seed2/evaluation/generation/examples.4b284b28bc4seed2_GEM-wiki_lingua_en_tldr_en_1.jsonl b/4b284b28bc4seed2/evaluation/generation/examples.4b284b28bc4seed2_GEM-wiki_lingua_en_tldr_en_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..92538795041d4ef7ded1dfd57f905698cc72cb56 --- /dev/null +++ b/4b284b28bc4seed2/evaluation/generation/examples.4b284b28bc4seed2_GEM-wiki_lingua_en_tldr_en_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d2463a21f68d4b51a0322e72dddd7630bcc3b4a065a0bed17c1084b101258606 +size 13325370 diff --git a/4b284b28bc4seed2/evaluation/generation/examples.4b284b28bc4seed2_GEM-wiki_lingua_en_tldr_en_2.jsonl b/4b284b28bc4seed2/evaluation/generation/examples.4b284b28bc4seed2_GEM-wiki_lingua_en_tldr_en_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..0b19e48b529a0eebb4e4b101ad768e7f53d0feb4 --- /dev/null +++ b/4b284b28bc4seed2/evaluation/generation/examples.4b284b28bc4seed2_GEM-wiki_lingua_en_tldr_en_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9615398abe4e5c7cb1a75537377f30931750092ac7f80c67bccf9ac4e912dd2e +size 18924226 diff --git a/4b284b28bc4seed2/evaluation/generation/examples.4b284b28bc4seed2_GEM-wiki_lingua_en_tldr_en_3.jsonl b/4b284b28bc4seed2/evaluation/generation/examples.4b284b28bc4seed2_GEM-wiki_lingua_en_tldr_en_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..df80236b3944d4cb56f1f9ecb916ad8f7c1c2fe4 --- /dev/null +++ b/4b284b28bc4seed2/evaluation/generation/examples.4b284b28bc4seed2_GEM-wiki_lingua_en_tldr_en_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c3b8ed8df9451efe52ed5fb1521ffed0316ddea156fa697f6ceeccb8e3b74b0 +size 24340351 diff --git a/4b284b28bc4seed2/evaluation/generation/examples.4b284b28bc4seed2_GEM-wiki_lingua_en_tldr_en_4.jsonl b/4b284b28bc4seed2/evaluation/generation/examples.4b284b28bc4seed2_GEM-wiki_lingua_en_tldr_en_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..78e523bdc7d42812ab12d4fda1072a90ed3e9e12 --- /dev/null +++ b/4b284b28bc4seed2/evaluation/generation/examples.4b284b28bc4seed2_GEM-wiki_lingua_en_tldr_en_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c3562fa883c3013f136291b4db95c280e59e59954271de84b5dba63f2a793b4 +size 29476803 diff --git a/4b284b28bc4seed2/evaluation/generation/examples.4b284b28bc4seed2_GEM-wiki_lingua_en_tldr_en_5.jsonl b/4b284b28bc4seed2/evaluation/generation/examples.4b284b28bc4seed2_GEM-wiki_lingua_en_tldr_en_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..576512ac54b6de9c933e5440eb8e27b4894e7f1a --- /dev/null +++ b/4b284b28bc4seed2/evaluation/generation/examples.4b284b28bc4seed2_GEM-wiki_lingua_en_tldr_en_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3836ffd39b8e9c542431e245f6636fcddb21710d0d8002cbf5c30838ca6a9619 +size 34800380 diff --git a/4b284b28bc4seed2/evaluation/generation/examples.4b284b28bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl b/4b284b28bc4seed2/evaluation/generation/examples.4b284b28bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..5ca3b47e3f0c11b2ee4132df8a60f435c668f429 --- /dev/null +++ b/4b284b28bc4seed2/evaluation/generation/examples.4b284b28bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a5e43a9967f644a113a7e675c09d4cb517b2ab9633333fb5407b36de2ba9541 +size 3983760 diff --git a/4b284b28bc4seed2/evaluation/generation/examples.4b284b28bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl b/4b284b28bc4seed2/evaluation/generation/examples.4b284b28bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..d918edefec47872f0b4be21b4188bca4919eb84d --- /dev/null +++ b/4b284b28bc4seed2/evaluation/generation/examples.4b284b28bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dac2bbdd8d529b0fff07a2c3a2338342ef45a6dc64b06851b37f3cab53958200 +size 5052493 diff --git a/4b284b28bc4seed2/evaluation/generation/examples.4b284b28bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl b/4b284b28bc4seed2/evaluation/generation/examples.4b284b28bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..3e4fdc6430eda2ce80d06850fdf3db65627e4ae2 --- /dev/null +++ b/4b284b28bc4seed2/evaluation/generation/examples.4b284b28bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef75acec76f843b198ed2f1ac3fc6197333b8f988aade57f7f81b9732462cf54 +size 6208152 diff --git a/4b284b28bc4seed2/evaluation/generation/examples.4b284b28bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl b/4b284b28bc4seed2/evaluation/generation/examples.4b284b28bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..2321bb9a6adc443bf2385e598a6fc7a63731be98 --- /dev/null +++ b/4b284b28bc4seed2/evaluation/generation/examples.4b284b28bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d66cfad28c3927140337e465ac6a93ab668415be36eb9f774e68c7775c792e7a +size 7324671 diff --git a/4b284b28bc4seed2/evaluation/generation/examples.4b284b28bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl b/4b284b28bc4seed2/evaluation/generation/examples.4b284b28bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..c816ba584435c8284e3fc1ffd9868b0d281b1eb1 --- /dev/null +++ b/4b284b28bc4seed2/evaluation/generation/examples.4b284b28bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a4720633d13191c4a353e9aeb9c29ac0e7be8e02ef67c17b7a91015aeffb0ec +size 8415521 diff --git a/4b284b28bc4seed2/evaluation/generation/examples.4b284b28bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl b/4b284b28bc4seed2/evaluation/generation/examples.4b284b28bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..18ce9619e874521c895e11f021bb2fb1b1c58158 --- /dev/null +++ b/4b284b28bc4seed2/evaluation/generation/examples.4b284b28bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06fa1606ee0e281d16ea4500899bc3d1edc2b2ca2533cc94c00029c73ae1eab7 +size 9513620 diff --git a/4b284b28bc4seed2/evaluation/generation/examples.4b284b28bc4seed2_gem_xsum_article_DOC_summary_0.jsonl b/4b284b28bc4seed2/evaluation/generation/examples.4b284b28bc4seed2_gem_xsum_article_DOC_summary_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..40547d58306d06bfa546006e35e62e7ab67780db --- /dev/null +++ b/4b284b28bc4seed2/evaluation/generation/examples.4b284b28bc4seed2_gem_xsum_article_DOC_summary_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2df15226353ef8dad4fbebfebc3f0f6c6fbfe4fddaed75f5915315774d17a76 +size 2817325 diff --git a/4b284b28bc4seed2/evaluation/generation/examples.4b284b28bc4seed2_gem_xsum_article_DOC_summary_1.jsonl b/4b284b28bc4seed2/evaluation/generation/examples.4b284b28bc4seed2_gem_xsum_article_DOC_summary_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..1366a9b2714226d1b13cb383ee145e3b5c87795b --- /dev/null +++ b/4b284b28bc4seed2/evaluation/generation/examples.4b284b28bc4seed2_gem_xsum_article_DOC_summary_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b8de33f440cd743c58f116ace639cc89e400816d7bc143231f307937c0fbf06 +size 5105122 diff --git a/4b284b28bc4seed2/evaluation/generation/examples.4b284b28bc4seed2_gem_xsum_article_DOC_summary_2.jsonl b/4b284b28bc4seed2/evaluation/generation/examples.4b284b28bc4seed2_gem_xsum_article_DOC_summary_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..78de96c13b9933db7f42ecb49969f66c1bc522e6 --- /dev/null +++ b/4b284b28bc4seed2/evaluation/generation/examples.4b284b28bc4seed2_gem_xsum_article_DOC_summary_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:00c14bf2ddaedcad3c2e85d1c647c6cfaa1073a79912f5d1f781326fd43ad634 +size 7377287 diff --git a/4b284b28bc4seed2/evaluation/generation/examples.4b284b28bc4seed2_gem_xsum_article_DOC_summary_3.jsonl b/4b284b28bc4seed2/evaluation/generation/examples.4b284b28bc4seed2_gem_xsum_article_DOC_summary_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..a377c64c268378debc0b6eff1f40628cd5d9077b --- /dev/null +++ b/4b284b28bc4seed2/evaluation/generation/examples.4b284b28bc4seed2_gem_xsum_article_DOC_summary_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d3b0354f4ee8ccdc9b2e05492424f08265bd45fd26799790da6926eea698cdd +size 9645989 diff --git a/4b284b28bc4seed2/evaluation/generation/examples.4b284b28bc4seed2_gem_xsum_article_DOC_summary_4.jsonl b/4b284b28bc4seed2/evaluation/generation/examples.4b284b28bc4seed2_gem_xsum_article_DOC_summary_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..774f95677329e8f7c6056685ff0c77537ba7223a --- /dev/null +++ b/4b284b28bc4seed2/evaluation/generation/examples.4b284b28bc4seed2_gem_xsum_article_DOC_summary_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b332fa9911e6b8a314cb6ce91be4192cbd3bd7fbcad8e10b96b65641967e0c5e +size 11670990 diff --git a/4b284b28bc4seed2/evaluation/generation/examples.4b284b28bc4seed2_gem_xsum_article_DOC_summary_5.jsonl b/4b284b28bc4seed2/evaluation/generation/examples.4b284b28bc4seed2_gem_xsum_article_DOC_summary_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..ae0cef7438218799253e4e16a621dc12db645e18 --- /dev/null +++ b/4b284b28bc4seed2/evaluation/generation/examples.4b284b28bc4seed2_gem_xsum_article_DOC_summary_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a184f503e67d035d57133c3617c9e387d6a74c0b6eb71a8ad2c28634610fb83 +size 13897610 diff --git a/4b284b28bc4seed2/evaluation/generation/slim.4b284b28bc4seed2_GEM-web_nlg_en_PALM_prompt_0.json b/4b284b28bc4seed2/evaluation/generation/slim.4b284b28bc4seed2_GEM-web_nlg_en_PALM_prompt_0.json new file mode 100644 index 0000000000000000000000000000000000000000..79d847416bfab2b5da52f1f071ac33dc52d51915 --- /dev/null +++ b/4b284b28bc4seed2/evaluation/generation/slim.4b284b28bc4seed2_GEM-web_nlg_en_PALM_prompt_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.33153388648094195, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.033005772984634425 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.07122303608863641, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0014591848220124259 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.30715399283349226, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.004708720401522559 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.10892120808244464, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0019623579408930523 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.03301457183266829, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0008587185375204866 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.14854387481989287, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.003193281253509643 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.05087917177498001, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0012052999188796845 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.06820659069603296, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0013384312711305548 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.29787923352571516, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004614486799091354 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.1046596223130991, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0018274939775881785 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.06782306790846614, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0013642733366910549 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.29321572118705336, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004444992160741671 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.10379069725870145, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0018395610209924003 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b28bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b28bc4seed2/evaluation/generation/slim.4b284b28bc4seed2_GEM-web_nlg_en_PALM_prompt_1.json b/4b284b28bc4seed2/evaluation/generation/slim.4b284b28bc4seed2_GEM-web_nlg_en_PALM_prompt_1.json new file mode 100644 index 0000000000000000000000000000000000000000..97f97ad478455822621029640d33440d97411cb2 --- /dev/null +++ b/4b284b28bc4seed2/evaluation/generation/slim.4b284b28bc4seed2_GEM-web_nlg_en_PALM_prompt_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.4390216732028977, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.02835432276037686 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.07291258825421418, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0012781399789461385 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.3797532045177941, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0054586371665182355 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.11512333876359498, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0017974110536525595 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.032868611308100475, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0007540345266181282 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.18168266286903503, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0037422324762068537 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.05213699889610434, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0010956033295937493 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.06806601322392085, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0011368722533979258 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.3553819785767932, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004968399489043776 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.10756044811692632, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.001603262453041204 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.06910714253449175, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0012031621148103201 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.3583493585506855, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.005014235277134646 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.10900979568571047, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0016850432132498889 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b28bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b28bc4seed2/evaluation/generation/slim.4b284b28bc4seed2_GEM-web_nlg_en_PALM_prompt_2.json b/4b284b28bc4seed2/evaluation/generation/slim.4b284b28bc4seed2_GEM-web_nlg_en_PALM_prompt_2.json new file mode 100644 index 0000000000000000000000000000000000000000..34b8e5b782b1ad7d031b04fa40ac6dbd909323b6 --- /dev/null +++ b/4b284b28bc4seed2/evaluation/generation/slim.4b284b28bc4seed2_GEM-web_nlg_en_PALM_prompt_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.49541929016035524, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.025797242026580104 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.07266725444927156, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0011715118352015903 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.392286147400258, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.005249827988828273 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.11565855599729363, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0016715046204442972 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.03317260466126409, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.000696598360418341 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.1942947439780873, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0038612870273807783 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.05321206929632585, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.001036190867375003 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.06822626222269808, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0010788080778881023 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.3658441206667177, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004744182177069523 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.10849753112690429, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0015324126427550334 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.06911868824793722, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0011075456309651759 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.3723196892015273, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004901964131441716 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.10994078611093397, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0015743454993528729 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b28bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b28bc4seed2/evaluation/generation/slim.4b284b28bc4seed2_GEM-web_nlg_en_PALM_prompt_3.json b/4b284b28bc4seed2/evaluation/generation/slim.4b284b28bc4seed2_GEM-web_nlg_en_PALM_prompt_3.json new file mode 100644 index 0000000000000000000000000000000000000000..e781eb00cb663acaa3be01523e50ec992272bf80 --- /dev/null +++ b/4b284b28bc4seed2/evaluation/generation/slim.4b284b28bc4seed2_GEM-web_nlg_en_PALM_prompt_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.5491960579253196, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.039648429482997495 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.07160364848852087, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0011783430176818728 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.3927842849413568, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.00522433426165448 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.11408517238759823, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0016665220312756322 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.03296327776337767, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0007230725204977183 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.19533584043693603, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0038707201775201655 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.052818017804867626, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0010623028200577843 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.06680503273038688, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0010837322892585253 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.36333847242647704, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004665099933938704 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.10630291986513662, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.001526814085910438 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.0681283239197468, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0011259165449605442 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.37225854905210065, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004887731193821206 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.10846020883153136, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0015890200535555973 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b28bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b28bc4seed2/evaluation/generation/slim.4b284b28bc4seed2_GEM-web_nlg_en_PALM_prompt_4.json b/4b284b28bc4seed2/evaluation/generation/slim.4b284b28bc4seed2_GEM-web_nlg_en_PALM_prompt_4.json new file mode 100644 index 0000000000000000000000000000000000000000..98cf7ee013c3036de924e6df2977561a01df7814 --- /dev/null +++ b/4b284b28bc4seed2/evaluation/generation/slim.4b284b28bc4seed2_GEM-web_nlg_en_PALM_prompt_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.6089661489117988, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.04699623217901871 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.07213518977803757, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0011476197609056422 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.3992239446300711, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.005128894156765551 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.11514000344336653, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0016184571331864207 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.033158630338207526, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0006987407020504501 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.20032190789144683, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0038236156171148734 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.05332935191373514, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0010277690042407401 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.06683680650160255, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0010578019098300508 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.36520991395591773, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004493220490046675 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.10644937066363529, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0014847353193029158 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.06848539496662703, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.001092766850551142 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.3773679563441165, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004791768779964645 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.10920289975227614, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0015389130963739533 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b28bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b28bc4seed2/evaluation/generation/slim.4b284b28bc4seed2_GEM-web_nlg_en_PALM_prompt_5.json b/4b284b28bc4seed2/evaluation/generation/slim.4b284b28bc4seed2_GEM-web_nlg_en_PALM_prompt_5.json new file mode 100644 index 0000000000000000000000000000000000000000..da00ece5b95743f5173cbeb3718d5b59d85f2c77 --- /dev/null +++ b/4b284b28bc4seed2/evaluation/generation/slim.4b284b28bc4seed2_GEM-web_nlg_en_PALM_prompt_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.6220539692203896, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.027241061650766073 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.0712682874127396, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0011261508589404943 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.40368204669190927, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.005176457083171882 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.11402382459454527, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0015862357548837988 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.0332020137953197, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0006861186130499352 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.20677377146703504, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0039525209229281264 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.05353546076223042, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0010071474225918618 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.06625798608998291, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0010442629568554243 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.3704875696637656, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004602314366146881 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.10577538472070054, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0014621636026219001 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.06783456627617492, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.001071886270802083 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.382465197548837, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004842551860701479 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.10844065292929861, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0015071351512198398 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b28bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b28bc4seed2/evaluation/generation/slim.4b284b28bc4seed2_GEM-wiki_lingua_en_tldr_en_0.json b/4b284b28bc4seed2/evaluation/generation/slim.4b284b28bc4seed2_GEM-wiki_lingua_en_tldr_en_0.json new file mode 100644 index 0000000000000000000000000000000000000000..93b33e9cdcfb00651ef3d279b8fc5d343d3620cf --- /dev/null +++ b/4b284b28bc4seed2/evaluation/generation/slim.4b284b28bc4seed2_GEM-wiki_lingua_en_tldr_en_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.15182550911429873, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0018688893384549484 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.2589242894485067, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0026517724171458952 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.1779625720124565, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0018340890133845323 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.030739869666078615, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0007500707956482545 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.05422083314217582, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0013617275020705638 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.036223836197762725, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0008360695449580615 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.1163914580615846, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0012923332758585293 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.20559642048990517, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0021063218448770372 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.13797458766444107, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.00128706736916593 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.13832783036931234, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0016858294437463758 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.23756775868205818, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.002450945116586128 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.1625132579484488, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0016598158056400846 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 1.5993765093997294, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.07506085369601702 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b28bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b28bc4seed2/evaluation/generation/slim.4b284b28bc4seed2_GEM-wiki_lingua_en_tldr_en_1.json b/4b284b28bc4seed2/evaluation/generation/slim.4b284b28bc4seed2_GEM-wiki_lingua_en_tldr_en_1.json new file mode 100644 index 0000000000000000000000000000000000000000..23a3614edb067ab7cf0aba521e939d7af9c5aaa6 --- /dev/null +++ b/4b284b28bc4seed2/evaluation/generation/slim.4b284b28bc4seed2_GEM-wiki_lingua_en_tldr_en_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.18496096563065467, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.002050002215955609 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.3135599264124284, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0027341763298141864 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.21598714377615563, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0019024221215778328 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.043438836648193035, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0008698319584098167 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.07611495800976509, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0016061241867093036 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.05092387173534868, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0009502922893863336 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.1281515256406243, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.001291169012274189 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.2264556395402032, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0021416748555613593 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.15160062635446855, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.001239572009665517 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.17280855254177024, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0019099792075058242 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.2938664218975422, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0025815210408538384 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.2019926405301408, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0017749314312316205 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 2.5200403089231775, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.05693901717280776 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b28bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b28bc4seed2/evaluation/generation/slim.4b284b28bc4seed2_GEM-wiki_lingua_en_tldr_en_2.json b/4b284b28bc4seed2/evaluation/generation/slim.4b284b28bc4seed2_GEM-wiki_lingua_en_tldr_en_2.json new file mode 100644 index 0000000000000000000000000000000000000000..a637aee53561bb58f67835fd8784a0e6106a3679 --- /dev/null +++ b/4b284b28bc4seed2/evaluation/generation/slim.4b284b28bc4seed2_GEM-wiki_lingua_en_tldr_en_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.19241271397106163, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.002086863578689543 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.32031046447154404, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0027181669208385484 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.22231924312892618, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0018757379527855871 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.048019665884255235, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.000949724643152317 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.0836751095859514, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0017264035814644186 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.05579012272313604, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0010124966408794026 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.13376141964932425, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0013725108527129226 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.23124667730229143, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0021820014245572915 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.15627127285797618, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0012523054332758818 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.18081556496647747, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0019520981988559959 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.3025117234925768, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0026055764102078075 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.20921146077018363, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.001755514182451968 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 2.8246220069939314, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.05436929747000312 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b28bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b28bc4seed2/evaluation/generation/slim.4b284b28bc4seed2_GEM-wiki_lingua_en_tldr_en_3.json b/4b284b28bc4seed2/evaluation/generation/slim.4b284b28bc4seed2_GEM-wiki_lingua_en_tldr_en_3.json new file mode 100644 index 0000000000000000000000000000000000000000..efca746dec7536812103e191d9ae7248f879f0aa --- /dev/null +++ b/4b284b28bc4seed2/evaluation/generation/slim.4b284b28bc4seed2_GEM-wiki_lingua_en_tldr_en_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.16640193920440474, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.002472882187893366 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.2649663905434579, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0032993991901049875 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.1848100615479409, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0022579690258614704 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.04051313387433241, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.001042560540352432 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.06748612349747192, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0016580523507809426 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.04536872008122934, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.001002873578150144 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.11778833422399672, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.001764546075584022 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.19297885421052255, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.002524627264850371 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.13129086818074612, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.001545448883255699 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.1560147423913123, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0023125754138923474 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.249482350470566, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0031348571322463346 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.17351085580896572, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.002116003523751111 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 2.775126184527832, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.04964262533072551 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b28bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b28bc4seed2/evaluation/generation/slim.4b284b28bc4seed2_GEM-wiki_lingua_en_tldr_en_4.json b/4b284b28bc4seed2/evaluation/generation/slim.4b284b28bc4seed2_GEM-wiki_lingua_en_tldr_en_4.json new file mode 100644 index 0000000000000000000000000000000000000000..5711c87d74e613d0e1b22620e7ae5a0120abf86b --- /dev/null +++ b/4b284b28bc4seed2/evaluation/generation/slim.4b284b28bc4seed2_GEM-wiki_lingua_en_tldr_en_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.05264325356647027, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0019548941831179097 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.08637392317712084, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0029446541600125875 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.05762199753523481, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0019234101466023426 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.012435473489888542, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0006697583811981027 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.022066243551567184, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.001176386791377328 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.013932175935494801, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.000677479417971868 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.038774748862737, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0014187651157647537 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.06558722529459496, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.002298264781788869 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.042630350228712206, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0014055059931358702 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.049317168459700536, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0018317279159510054 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.08119886671766297, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.002771971428999714 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.05397101577019339, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.001795986537373056 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 0.6328100673630783, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.039922860842299984 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b28bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b28bc4seed2/evaluation/generation/slim.4b284b28bc4seed2_GEM-wiki_lingua_en_tldr_en_5.json b/4b284b28bc4seed2/evaluation/generation/slim.4b284b28bc4seed2_GEM-wiki_lingua_en_tldr_en_5.json new file mode 100644 index 0000000000000000000000000000000000000000..66750605a7cd33459067d8283541ba59a81c0432 --- /dev/null +++ b/4b284b28bc4seed2/evaluation/generation/slim.4b284b28bc4seed2_GEM-wiki_lingua_en_tldr_en_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.008573781066321003, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0008654762638624486 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.013672256166431493, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0012985268683484443 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.009114245109778818, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0008561600546824989 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.001966748909838605, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.00025417327235094497 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.0033662241091160935, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0004534618115491094 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.0021689783329266383, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.00026415328416558304 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.006239534916325571, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0006307296825652261 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.010041041492697021, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0009608570474005339 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.006612705879560682, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0006186105809635613 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.007874956167229618, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0007946305678768076 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.01258508198697765, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0011929631283971707 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.008378974054458118, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0007859574648450136 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 1.8294461842495436e-06, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 2.8960441784514307e-06 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b28bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b28bc4seed2/evaluation/generation/slim.4b284b28bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_0.json b/4b284b28bc4seed2/evaluation/generation/slim.4b284b28bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_0.json new file mode 100644 index 0000000000000000000000000000000000000000..d05510f881a2849144c481b2ec70c612b4c15ebb --- /dev/null +++ b/4b284b28bc4seed2/evaluation/generation/slim.4b284b28bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 1.4134342817933134, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.10321165497606506 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.10247313979693526, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0016595089176992329 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.08798141485351638, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0020421795807805876 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.07268079919042715, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0013299276492676378 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.00887479842846684, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0005272736841464594 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.014404059874404535, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0007753598252854332 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.00993468622248673, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0005343002508124515 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.10002794388883973, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0015746721314263722 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.08578186838136309, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.001963617682885378 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.07081998927780214, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0012624377157260348 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.09505113511885002, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0016104542116781076 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.07341402605300737, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0017014954492227232 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.06325547718223694, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.001146593422118666 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b28bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b28bc4seed2/evaluation/generation/slim.4b284b28bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_1.json b/4b284b28bc4seed2/evaluation/generation/slim.4b284b28bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_1.json new file mode 100644 index 0000000000000000000000000000000000000000..d14ab1ad991bafc904dc3068f04ef99c737e1465 --- /dev/null +++ b/4b284b28bc4seed2/evaluation/generation/slim.4b284b28bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 11.161361331881567, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.12372614680699576 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.5102128961431266, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0032435467042979615 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.41996959404299955, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.003000739317309415 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.4325678229581062, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.002292323583369995 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.2347486548964982, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0025124030520577855 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.18995161561629698, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.002108346628324476 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.19587297305804474, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0019046996832194681 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.3718563664348661, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0028475505595708522 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.302335969435588, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.002389554465547073 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.3125033610005072, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.001959745932298407 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.41834560442201607, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0030773847535100003 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.3428712422996488, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0027256967100605344 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.35360222601109786, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.002221056794276662 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b28bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b28bc4seed2/evaluation/generation/slim.4b284b28bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_2.json b/4b284b28bc4seed2/evaluation/generation/slim.4b284b28bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_2.json new file mode 100644 index 0000000000000000000000000000000000000000..41deac72e1128b13029271b22c827ad62f99fd5e --- /dev/null +++ b/4b284b28bc4seed2/evaluation/generation/slim.4b284b28bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 11.178478800336915, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.18720778468970048 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.4641458682797714, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.002971633166316723 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.45712689402679485, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0028529123911751396 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.43564156295510353, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.002087610230342593 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.21534769962339712, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0023043178046714048 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.21108519516124935, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.002144830729960772 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.20007291305638683, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0018220503474021836 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.3373737455708324, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.002541494576877095 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.3312050835060631, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0023578769935104662 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.3154129310627208, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0017997732274878523 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.38666807747150694, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.002816195982796137 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.3803128282949514, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.002684776810203093 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.36253839271187577, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0020879729234347427 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b28bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b28bc4seed2/evaluation/generation/slim.4b284b28bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_3.json b/4b284b28bc4seed2/evaluation/generation/slim.4b284b28bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_3.json new file mode 100644 index 0000000000000000000000000000000000000000..df11ece526a86fd7f1848e0d8c6da204544c89e4 --- /dev/null +++ b/4b284b28bc4seed2/evaluation/generation/slim.4b284b28bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 11.078551573988406, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.1775440487553758 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.43295946805897406, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0024929063336741916 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.47117854558838085, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0027664367541802696 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.4326675462538715, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0019582645124443902 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.2009303237548315, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0019532985877392488 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.22075863091567335, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0021918759824511784 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.200583189798169, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0017572494683324837 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.31641399110077373, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.002147128833979884 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.3443145885276902, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.002348509165132024 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.31563666321158207, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0017274457082887083 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.3650689748250584, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0024222254606659755 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.3971452452707439, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0026671950920676476 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.36464056912358683, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.002012766885114503 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b28bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b28bc4seed2/evaluation/generation/slim.4b284b28bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_4.json b/4b284b28bc4seed2/evaluation/generation/slim.4b284b28bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_4.json new file mode 100644 index 0000000000000000000000000000000000000000..43a6b6d7f7544203a712ff0fae293e791c876793 --- /dev/null +++ b/4b284b28bc4seed2/evaluation/generation/slim.4b284b28bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 11.26779671250681, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.20945092499394355 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.42504057259498224, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.002302694388890242 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.479467443521395, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.002694693864079371 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.43468339695150743, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0019192301545953678 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.19787815742992643, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0018370754370625954 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.22626550198253664, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.002204792167524998 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.202879451815592, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.001765189527045149 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.31019836982770554, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.001959650847184396 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.3507681740649588, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0023395609242667513 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.3172808489106893, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0017201307043284524 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.3582038693968529, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0022423131040152167 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.40461547051620306, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0026339178059616598 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.36655599606622596, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0019897208220121514 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b28bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b28bc4seed2/evaluation/generation/slim.4b284b28bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_5.json b/4b284b28bc4seed2/evaluation/generation/slim.4b284b28bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_5.json new file mode 100644 index 0000000000000000000000000000000000000000..09220e41547369c932bde4122f5374451e728731 --- /dev/null +++ b/4b284b28bc4seed2/evaluation/generation/slim.4b284b28bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 11.056827999458564, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.18078644474517908 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.41637768269876485, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.002227557311413217 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.48001165743040636, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0026762804898328154 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.4309560903845341, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.001893293831351894 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.19341945111333012, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0017901333419283593 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.22629146190496788, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.002191585425335327 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.20083246520570572, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0017445182528093705 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.303929949160996, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0018891083086755413 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.35261189373922003, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0023727357497467937 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.31519997823452967, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0017133598116412512 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.35227968062569365, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0021866137017689286 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.4064043196987044, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.002605112678915691 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.3646984779801211, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.001960028955951922 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b28bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b28bc4seed2/evaluation/generation/slim.4b284b28bc4seed2_gem_xsum_article_DOC_summary_0.json b/4b284b28bc4seed2/evaluation/generation/slim.4b284b28bc4seed2_gem_xsum_article_DOC_summary_0.json new file mode 100644 index 0000000000000000000000000000000000000000..ee80c0bbd14b28c456ad8f59fc624754fae01eb8 --- /dev/null +++ b/4b284b28bc4seed2/evaluation/generation/slim.4b284b28bc4seed2_gem_xsum_article_DOC_summary_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.16347573034711765, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.002235052767052065 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.361809595461701, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.004450055018587551 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.21824095908596577, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0025874062237003148 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.04080119463614899, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0013586822504416986 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.09489684727762387, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0030304863214365187 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.055096743612893836, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0017015215521108862 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.12349304284569401, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0017244637096469517 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.27540408956152623, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0035538299823413846 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.1649602106468539, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0019703191216796398 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.12787359610941754, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0018576292031407871 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.2854470256837463, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.003942621790562841 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.1710468546463645, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0022098555753275687 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 2.295517441700607, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.09915357248852676 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b28bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b28bc4seed2/evaluation/generation/slim.4b284b28bc4seed2_gem_xsum_article_DOC_summary_1.json b/4b284b28bc4seed2/evaluation/generation/slim.4b284b28bc4seed2_gem_xsum_article_DOC_summary_1.json new file mode 100644 index 0000000000000000000000000000000000000000..457c1e9d0bca6bcead1cd5511e4d162a070e17d0 --- /dev/null +++ b/4b284b28bc4seed2/evaluation/generation/slim.4b284b28bc4seed2_gem_xsum_article_DOC_summary_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.12498263517558904, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0018439932798174727 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.30997040065867815, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.004377559967707829 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.1759444559759621, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0024983727013912576 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.023984343121594594, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0009703036853821361 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.061937587800487796, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0025773754792855217 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.03416151854233213, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0013809223175216116 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.09683506809823249, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0013556223253912536 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.24217304938796147, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.003372900627372106 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.13659440083004393, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0018529344115148084 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.099266332557722, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0014699947767357671 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.2484370722635638, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0036565129132140007 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.14008466520947307, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0020194523247221608 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 1.3192475830096537, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.07504584122763394 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b28bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b28bc4seed2/evaluation/generation/slim.4b284b28bc4seed2_gem_xsum_article_DOC_summary_2.json b/4b284b28bc4seed2/evaluation/generation/slim.4b284b28bc4seed2_gem_xsum_article_DOC_summary_2.json new file mode 100644 index 0000000000000000000000000000000000000000..6ec6f8b6f954893ce63f01a249f528d3ea11f649 --- /dev/null +++ b/4b284b28bc4seed2/evaluation/generation/slim.4b284b28bc4seed2_gem_xsum_article_DOC_summary_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.12308471402675025, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0017964024163926668 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.30420591170874123, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.0042091034345315345 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.17317479594583315, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0024306874343318695 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.024998880277592218, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0009660509776349401 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.06368455444982171, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.002497504245191044 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.03548103421040685, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0013648086670444103 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.09766064805279387, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0013763841420730348 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.24210898643660594, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.003269851529578185 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.13747942038634384, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0018617507575533767 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.09700451417856086, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0014713838347837971 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.2416228650888391, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.003570749791914669 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.13676635773915868, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.002012262737653545 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 1.3941983933749893, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.07778092606300743 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b28bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b28bc4seed2/evaluation/generation/slim.4b284b28bc4seed2_gem_xsum_article_DOC_summary_3.json b/4b284b28bc4seed2/evaluation/generation/slim.4b284b28bc4seed2_gem_xsum_article_DOC_summary_3.json new file mode 100644 index 0000000000000000000000000000000000000000..2cb4e8656df885637dbe7113600c63df34b6a30e --- /dev/null +++ b/4b284b28bc4seed2/evaluation/generation/slim.4b284b28bc4seed2_gem_xsum_article_DOC_summary_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.1238798362783257, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0020371925631676394 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.2938277668513655, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.004445484366807697 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.17052015726603906, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0026006019517768233 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.025223685922742684, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0010126897278031643 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.06217111485022419, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0025204701650283143 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.03519128429327673, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0013864951253610754 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.09880564731360271, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0015869573723169535 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.2348719293167949, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0034616442328126336 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.1359902514132361, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.002000179300648128 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.09736356730337334, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0016253165748697476 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.23279761437533245, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0036609997549228836 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.13420532702105284, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0020736765057759775 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 1.447300262525524, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.0647434385662156 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b28bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b28bc4seed2/evaluation/generation/slim.4b284b28bc4seed2_gem_xsum_article_DOC_summary_4.json b/4b284b28bc4seed2/evaluation/generation/slim.4b284b28bc4seed2_gem_xsum_article_DOC_summary_4.json new file mode 100644 index 0000000000000000000000000000000000000000..9c74b152d761bef6384eeb50192dddefe1695085 --- /dev/null +++ b/4b284b28bc4seed2/evaluation/generation/slim.4b284b28bc4seed2_gem_xsum_article_DOC_summary_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.03916972701362441, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0025232037599719035 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.0705187151734879, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.0041033703238095975 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.04587682793613896, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0026664431362576437 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.007496872523694719, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0009023223955939198 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.013768613253728622, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0013735135943198867 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.008749872613988179, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0008910869873582503 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.03154543945422246, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0020528668246378276 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.05618648837737757, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0032188263348742517 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.03641897598226805, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0020590368431718546 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.031542117455926555, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0021071412880804725 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.055916896434064445, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.003269542426299847 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.036286088799465356, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.002099169574521433 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 0.6399540831907461, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.0665572258832638 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b28bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b28bc4seed2/evaluation/generation/slim.4b284b28bc4seed2_gem_xsum_article_DOC_summary_5.json b/4b284b28bc4seed2/evaluation/generation/slim.4b284b28bc4seed2_gem_xsum_article_DOC_summary_5.json new file mode 100644 index 0000000000000000000000000000000000000000..36f543d526bb637b559f0ab67791ef7607f0f8c9 --- /dev/null +++ b/4b284b28bc4seed2/evaluation/generation/slim.4b284b28bc4seed2_gem_xsum_article_DOC_summary_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.0030262317078135763, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0008861957572341574 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.002682824319713878, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.0008349754331976099 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.002797377262876916, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0008436395309397021 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.0005864695792553728, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0003600452195293311 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.0005925913708932577, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.00039524060846512425 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.0005852654722501501, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.00037583234587724155 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.0023057883289935395, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0006706823613650493 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.002115155017368573, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0006595785512806381 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.002169100825975142, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0006545600161608136 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.00240202126410433, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0007072328465422081 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.0021726632985610644, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0006770960348507971 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.002243893464585761, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0006801725997564016 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 4.294601973766167e-36, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 7.391409466573723e-32 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b28bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b28bc4seed2/evaluation/rankeval/4b284b28bc4seed2_0.json b/4b284b28bc4seed2/evaluation/rankeval/4b284b28bc4seed2_0.json new file mode 100644 index 0000000000000000000000000000000000000000..1ec971905a50ff4b07dc4ed5108c1d2c5f09cf6e --- /dev/null +++ b/4b284b28bc4seed2/evaluation/rankeval/4b284b28bc4seed2_0.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.318, + "acc_stderr": 0.014734079309311901 + }, + "anli_r2": { + "acc": 0.331, + "acc_stderr": 0.01488827258820394 + }, + "anli_r3": { + "acc": 0.33916666666666667, + "acc_stderr": 0.013672343491681808 + }, + "cb": { + "acc": 0.375, + "acc_stderr": 0.06527912098338669, + "f1": 0.1986111111111111 + }, + "copa": { + "acc": 0.77, + "acc_stderr": 0.04229525846816506 + }, + "hellaswag": { + "acc": 0.47649870543716394, + "acc_stderr": 0.004984266543053125, + "acc_norm": 0.6253734315873332, + "acc_norm_stderr": 0.004830371317841073 + }, + "rte": { + "acc": 0.5487364620938628, + "acc_stderr": 0.029953149241808946 + }, + "winogrande": { + "acc": 0.5753749013417522, + "acc_stderr": 0.01389189315026423 + }, + "storycloze_2016": { + "acc": 0.7226082308925709, + "acc_stderr": 0.010353267472010765 + }, + "boolq": { + "acc": 0.5501529051987768, + "acc_stderr": 0.008700950643028798 + }, + "arc_easy": { + "acc": 0.6077441077441077, + "acc_stderr": 0.010018744689650043, + "acc_norm": 0.539983164983165, + "acc_norm_stderr": 0.010226927233491506 + }, + "arc_challenge": { + "acc": 0.28498293515358364, + "acc_stderr": 0.013191348179838793, + "acc_norm": 0.30204778156996587, + "acc_norm_stderr": 0.013417519144716422 + }, + "sciq": { + "acc": 0.849, + "acc_stderr": 0.011328165223341671, + "acc_norm": 0.758, + "acc_norm_stderr": 0.013550631705555956 + }, + "piqa": { + "acc": 0.7519042437431991, + "acc_stderr": 0.010077118315574719, + "acc_norm": 0.7589771490750816, + "acc_norm_stderr": 0.009979042717267314 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b28bc4seed2/evaluation/rankeval/4b284b28bc4seed2_0_lm-eval_global_step80108_2023-02-15-11-04-05_0shots_backup.json b/4b284b28bc4seed2/evaluation/rankeval/4b284b28bc4seed2_0_lm-eval_global_step80108_2023-02-15-11-04-05_0shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..1ec971905a50ff4b07dc4ed5108c1d2c5f09cf6e --- /dev/null +++ b/4b284b28bc4seed2/evaluation/rankeval/4b284b28bc4seed2_0_lm-eval_global_step80108_2023-02-15-11-04-05_0shots_backup.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.318, + "acc_stderr": 0.014734079309311901 + }, + "anli_r2": { + "acc": 0.331, + "acc_stderr": 0.01488827258820394 + }, + "anli_r3": { + "acc": 0.33916666666666667, + "acc_stderr": 0.013672343491681808 + }, + "cb": { + "acc": 0.375, + "acc_stderr": 0.06527912098338669, + "f1": 0.1986111111111111 + }, + "copa": { + "acc": 0.77, + "acc_stderr": 0.04229525846816506 + }, + "hellaswag": { + "acc": 0.47649870543716394, + "acc_stderr": 0.004984266543053125, + "acc_norm": 0.6253734315873332, + "acc_norm_stderr": 0.004830371317841073 + }, + "rte": { + "acc": 0.5487364620938628, + "acc_stderr": 0.029953149241808946 + }, + "winogrande": { + "acc": 0.5753749013417522, + "acc_stderr": 0.01389189315026423 + }, + "storycloze_2016": { + "acc": 0.7226082308925709, + "acc_stderr": 0.010353267472010765 + }, + "boolq": { + "acc": 0.5501529051987768, + "acc_stderr": 0.008700950643028798 + }, + "arc_easy": { + "acc": 0.6077441077441077, + "acc_stderr": 0.010018744689650043, + "acc_norm": 0.539983164983165, + "acc_norm_stderr": 0.010226927233491506 + }, + "arc_challenge": { + "acc": 0.28498293515358364, + "acc_stderr": 0.013191348179838793, + "acc_norm": 0.30204778156996587, + "acc_norm_stderr": 0.013417519144716422 + }, + "sciq": { + "acc": 0.849, + "acc_stderr": 0.011328165223341671, + "acc_norm": 0.758, + "acc_norm_stderr": 0.013550631705555956 + }, + "piqa": { + "acc": 0.7519042437431991, + "acc_stderr": 0.010077118315574719, + "acc_norm": 0.7589771490750816, + "acc_norm_stderr": 0.009979042717267314 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b28bc4seed2/evaluation/rankeval/4b284b28bc4seed2_1.json b/4b284b28bc4seed2/evaluation/rankeval/4b284b28bc4seed2_1.json new file mode 100644 index 0000000000000000000000000000000000000000..8c1c302161fdeb86fd0aef761677c38617f14ca2 --- /dev/null +++ b/4b284b28bc4seed2/evaluation/rankeval/4b284b28bc4seed2_1.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.334, + "acc_stderr": 0.014922019523732953 + }, + "anli_r2": { + "acc": 0.321, + "acc_stderr": 0.01477082181793464 + }, + "anli_r3": { + "acc": 0.3408333333333333, + "acc_stderr": 0.013688600793296936 + }, + "cb": { + "acc": 0.4107142857142857, + "acc_stderr": 0.0663363415035954, + "f1": 0.3390804597701149 + }, + "copa": { + "acc": 0.77, + "acc_stderr": 0.04229525846816506 + }, + "hellaswag": { + "acc": 0.4743079067914758, + "acc_stderr": 0.004983189711208521, + "acc_norm": 0.625273849830711, + "acc_norm_stderr": 0.004830628620181016 + }, + "rte": { + "acc": 0.5090252707581228, + "acc_stderr": 0.030091559826331334 + }, + "winogrande": { + "acc": 0.5722178374112076, + "acc_stderr": 0.01390513401383995 + }, + "storycloze_2016": { + "acc": 0.7113842864778194, + "acc_stderr": 0.01047831178564294 + }, + "boolq": { + "acc": 0.6305810397553517, + "acc_stderr": 0.008441557531799619 + }, + "arc_easy": { + "acc": 0.6224747474747475, + "acc_stderr": 0.009947227833469432, + "acc_norm": 0.5686026936026936, + "acc_norm_stderr": 0.01016275284774751 + }, + "arc_challenge": { + "acc": 0.29692832764505117, + "acc_stderr": 0.013352025976725225, + "acc_norm": 0.31313993174061433, + "acc_norm_stderr": 0.013552671543623504 + }, + "sciq": { + "acc": 0.889, + "acc_stderr": 0.009938701010583726, + "acc_norm": 0.867, + "acc_norm_stderr": 0.010743669132397337 + }, + "piqa": { + "acc": 0.7480957562568009, + "acc_stderr": 0.010128421335088683, + "acc_norm": 0.7562568008705114, + "acc_norm_stderr": 0.010017199471500609 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b28bc4seed2/evaluation/rankeval/4b284b28bc4seed2_1_lm-eval_global_step80108_2023-02-15-11-04-05_1shots_backup.json b/4b284b28bc4seed2/evaluation/rankeval/4b284b28bc4seed2_1_lm-eval_global_step80108_2023-02-15-11-04-05_1shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..8c1c302161fdeb86fd0aef761677c38617f14ca2 --- /dev/null +++ b/4b284b28bc4seed2/evaluation/rankeval/4b284b28bc4seed2_1_lm-eval_global_step80108_2023-02-15-11-04-05_1shots_backup.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.334, + "acc_stderr": 0.014922019523732953 + }, + "anli_r2": { + "acc": 0.321, + "acc_stderr": 0.01477082181793464 + }, + "anli_r3": { + "acc": 0.3408333333333333, + "acc_stderr": 0.013688600793296936 + }, + "cb": { + "acc": 0.4107142857142857, + "acc_stderr": 0.0663363415035954, + "f1": 0.3390804597701149 + }, + "copa": { + "acc": 0.77, + "acc_stderr": 0.04229525846816506 + }, + "hellaswag": { + "acc": 0.4743079067914758, + "acc_stderr": 0.004983189711208521, + "acc_norm": 0.625273849830711, + "acc_norm_stderr": 0.004830628620181016 + }, + "rte": { + "acc": 0.5090252707581228, + "acc_stderr": 0.030091559826331334 + }, + "winogrande": { + "acc": 0.5722178374112076, + "acc_stderr": 0.01390513401383995 + }, + "storycloze_2016": { + "acc": 0.7113842864778194, + "acc_stderr": 0.01047831178564294 + }, + "boolq": { + "acc": 0.6305810397553517, + "acc_stderr": 0.008441557531799619 + }, + "arc_easy": { + "acc": 0.6224747474747475, + "acc_stderr": 0.009947227833469432, + "acc_norm": 0.5686026936026936, + "acc_norm_stderr": 0.01016275284774751 + }, + "arc_challenge": { + "acc": 0.29692832764505117, + "acc_stderr": 0.013352025976725225, + "acc_norm": 0.31313993174061433, + "acc_norm_stderr": 0.013552671543623504 + }, + "sciq": { + "acc": 0.889, + "acc_stderr": 0.009938701010583726, + "acc_norm": 0.867, + "acc_norm_stderr": 0.010743669132397337 + }, + "piqa": { + "acc": 0.7480957562568009, + "acc_stderr": 0.010128421335088683, + "acc_norm": 0.7562568008705114, + "acc_norm_stderr": 0.010017199471500609 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b28bc4seed2/evaluation/rankeval/4b284b28bc4seed2_2.json b/4b284b28bc4seed2/evaluation/rankeval/4b284b28bc4seed2_2.json new file mode 100644 index 0000000000000000000000000000000000000000..46d433470bc966dba154e648c3e02fa10576b93a --- /dev/null +++ b/4b284b28bc4seed2/evaluation/rankeval/4b284b28bc4seed2_2.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.315, + "acc_stderr": 0.0146966319607925 + }, + "anli_r2": { + "acc": 0.345, + "acc_stderr": 0.015039986742055237 + }, + "anli_r3": { + "acc": 0.3175, + "acc_stderr": 0.013443538681348054 + }, + "cb": { + "acc": 0.17857142857142858, + "acc_stderr": 0.05164277182008721, + "f1": 0.16728395061728393 + }, + "copa": { + "acc": 0.81, + "acc_stderr": 0.03942772444036623 + }, + "hellaswag": { + "acc": 0.4751045608444533, + "acc_stderr": 0.004983592410934173, + "acc_norm": 0.6286596295558654, + "acc_norm_stderr": 0.004821757734156732 + }, + "rte": { + "acc": 0.4981949458483754, + "acc_stderr": 0.030096267148976633 + }, + "winogrande": { + "acc": 0.5927387529597474, + "acc_stderr": 0.013808654122417845 + }, + "storycloze_2016": { + "acc": 0.7188669160876536, + "acc_stderr": 0.010395836091628112 + }, + "boolq": { + "acc": 0.6339449541284403, + "acc_stderr": 0.008425419107728748 + }, + "arc_easy": { + "acc": 0.6174242424242424, + "acc_stderr": 0.009972837790531477, + "acc_norm": 0.5942760942760943, + "acc_norm_stderr": 0.01007575554012888 + }, + "arc_challenge": { + "acc": 0.30204778156996587, + "acc_stderr": 0.01341751914471642, + "acc_norm": 0.3242320819112628, + "acc_norm_stderr": 0.01367881039951882 + }, + "sciq": { + "acc": 0.903, + "acc_stderr": 0.00936368937324811, + "acc_norm": 0.88, + "acc_norm_stderr": 0.010281328012747386 + }, + "piqa": { + "acc": 0.749727965179543, + "acc_stderr": 0.010106561880089782, + "acc_norm": 0.7568008705114254, + "acc_norm_stderr": 0.010009611953858922 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b28bc4seed2/evaluation/rankeval/4b284b28bc4seed2_2_lm-eval_global_step80108_2023-02-15-11-04-05_2shots_backup.json b/4b284b28bc4seed2/evaluation/rankeval/4b284b28bc4seed2_2_lm-eval_global_step80108_2023-02-15-11-04-05_2shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..46d433470bc966dba154e648c3e02fa10576b93a --- /dev/null +++ b/4b284b28bc4seed2/evaluation/rankeval/4b284b28bc4seed2_2_lm-eval_global_step80108_2023-02-15-11-04-05_2shots_backup.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.315, + "acc_stderr": 0.0146966319607925 + }, + "anli_r2": { + "acc": 0.345, + "acc_stderr": 0.015039986742055237 + }, + "anli_r3": { + "acc": 0.3175, + "acc_stderr": 0.013443538681348054 + }, + "cb": { + "acc": 0.17857142857142858, + "acc_stderr": 0.05164277182008721, + "f1": 0.16728395061728393 + }, + "copa": { + "acc": 0.81, + "acc_stderr": 0.03942772444036623 + }, + "hellaswag": { + "acc": 0.4751045608444533, + "acc_stderr": 0.004983592410934173, + "acc_norm": 0.6286596295558654, + "acc_norm_stderr": 0.004821757734156732 + }, + "rte": { + "acc": 0.4981949458483754, + "acc_stderr": 0.030096267148976633 + }, + "winogrande": { + "acc": 0.5927387529597474, + "acc_stderr": 0.013808654122417845 + }, + "storycloze_2016": { + "acc": 0.7188669160876536, + "acc_stderr": 0.010395836091628112 + }, + "boolq": { + "acc": 0.6339449541284403, + "acc_stderr": 0.008425419107728748 + }, + "arc_easy": { + "acc": 0.6174242424242424, + "acc_stderr": 0.009972837790531477, + "acc_norm": 0.5942760942760943, + "acc_norm_stderr": 0.01007575554012888 + }, + "arc_challenge": { + "acc": 0.30204778156996587, + "acc_stderr": 0.01341751914471642, + "acc_norm": 0.3242320819112628, + "acc_norm_stderr": 0.01367881039951882 + }, + "sciq": { + "acc": 0.903, + "acc_stderr": 0.00936368937324811, + "acc_norm": 0.88, + "acc_norm_stderr": 0.010281328012747386 + }, + "piqa": { + "acc": 0.749727965179543, + "acc_stderr": 0.010106561880089782, + "acc_norm": 0.7568008705114254, + "acc_norm_stderr": 0.010009611953858922 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b28bc4seed2/evaluation/rankeval/4b284b28bc4seed2_3.json b/4b284b28bc4seed2/evaluation/rankeval/4b284b28bc4seed2_3.json new file mode 100644 index 0000000000000000000000000000000000000000..7d327a82c41d33f5a6312aecd06e4bf6d8152b18 --- /dev/null +++ b/4b284b28bc4seed2/evaluation/rankeval/4b284b28bc4seed2_3.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.331, + "acc_stderr": 0.01488827258820394 + }, + "anli_r2": { + "acc": 0.341, + "acc_stderr": 0.0149981313484027 + }, + "anli_r3": { + "acc": 0.34, + "acc_stderr": 0.0136804957257678 + }, + "cb": { + "acc": 0.2857142857142857, + "acc_stderr": 0.060914490387317256, + "f1": 0.2849772788024592 + }, + "copa": { + "acc": 0.8, + "acc_stderr": 0.04020151261036843 + }, + "hellaswag": { + "acc": 0.47450707030472017, + "acc_stderr": 0.00498329157828904, + "acc_norm": 0.6297550288787094, + "acc_norm_stderr": 0.004818833521340352 + }, + "rte": { + "acc": 0.49458483754512633, + "acc_stderr": 0.03009469812323996 + }, + "winogrande": { + "acc": 0.5761641673243884, + "acc_stderr": 0.013888492389944511 + }, + "storycloze_2016": { + "acc": 0.7177979690005345, + "acc_stderr": 0.01040783447964767 + }, + "boolq": { + "acc": 0.6278287461773701, + "acc_stderr": 0.008454434247373908 + }, + "arc_easy": { + "acc": 0.625, + "acc_stderr": 0.009933992677987828, + "acc_norm": 0.5984848484848485, + "acc_norm_stderr": 0.010058790020755562 + }, + "arc_challenge": { + "acc": 0.3037542662116041, + "acc_stderr": 0.01343890918477875, + "acc_norm": 0.3319112627986348, + "acc_norm_stderr": 0.013760988200880538 + }, + "sciq": { + "acc": 0.901, + "acc_stderr": 0.009449248027662751, + "acc_norm": 0.886, + "acc_norm_stderr": 0.010055103435823332 + }, + "piqa": { + "acc": 0.7486398258977149, + "acc_stderr": 0.010121156016819257, + "acc_norm": 0.7665941240478781, + "acc_norm_stderr": 0.009869247889520998 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b28bc4seed2/evaluation/rankeval/4b284b28bc4seed2_3_lm-eval_global_step80108_2023-02-15-11-04-05_3shots_backup.json b/4b284b28bc4seed2/evaluation/rankeval/4b284b28bc4seed2_3_lm-eval_global_step80108_2023-02-15-11-04-05_3shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..7d327a82c41d33f5a6312aecd06e4bf6d8152b18 --- /dev/null +++ b/4b284b28bc4seed2/evaluation/rankeval/4b284b28bc4seed2_3_lm-eval_global_step80108_2023-02-15-11-04-05_3shots_backup.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.331, + "acc_stderr": 0.01488827258820394 + }, + "anli_r2": { + "acc": 0.341, + "acc_stderr": 0.0149981313484027 + }, + "anli_r3": { + "acc": 0.34, + "acc_stderr": 0.0136804957257678 + }, + "cb": { + "acc": 0.2857142857142857, + "acc_stderr": 0.060914490387317256, + "f1": 0.2849772788024592 + }, + "copa": { + "acc": 0.8, + "acc_stderr": 0.04020151261036843 + }, + "hellaswag": { + "acc": 0.47450707030472017, + "acc_stderr": 0.00498329157828904, + "acc_norm": 0.6297550288787094, + "acc_norm_stderr": 0.004818833521340352 + }, + "rte": { + "acc": 0.49458483754512633, + "acc_stderr": 0.03009469812323996 + }, + "winogrande": { + "acc": 0.5761641673243884, + "acc_stderr": 0.013888492389944511 + }, + "storycloze_2016": { + "acc": 0.7177979690005345, + "acc_stderr": 0.01040783447964767 + }, + "boolq": { + "acc": 0.6278287461773701, + "acc_stderr": 0.008454434247373908 + }, + "arc_easy": { + "acc": 0.625, + "acc_stderr": 0.009933992677987828, + "acc_norm": 0.5984848484848485, + "acc_norm_stderr": 0.010058790020755562 + }, + "arc_challenge": { + "acc": 0.3037542662116041, + "acc_stderr": 0.01343890918477875, + "acc_norm": 0.3319112627986348, + "acc_norm_stderr": 0.013760988200880538 + }, + "sciq": { + "acc": 0.901, + "acc_stderr": 0.009449248027662751, + "acc_norm": 0.886, + "acc_norm_stderr": 0.010055103435823332 + }, + "piqa": { + "acc": 0.7486398258977149, + "acc_stderr": 0.010121156016819257, + "acc_norm": 0.7665941240478781, + "acc_norm_stderr": 0.009869247889520998 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b28bc4seed2/evaluation/rankeval/4b284b28bc4seed2_4.json b/4b284b28bc4seed2/evaluation/rankeval/4b284b28bc4seed2_4.json new file mode 100644 index 0000000000000000000000000000000000000000..a495c3d7cb4be80b0fbf74f463206b96398d1c97 --- /dev/null +++ b/4b284b28bc4seed2/evaluation/rankeval/4b284b28bc4seed2_4.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.325, + "acc_stderr": 0.014818724459095526 + }, + "anli_r2": { + "acc": 0.335, + "acc_stderr": 0.014933117490932577 + }, + "anli_r3": { + "acc": 0.3383333333333333, + "acc_stderr": 0.013664144006618268 + }, + "cb": { + "acc": 0.21428571428571427, + "acc_stderr": 0.055328333517248834, + "f1": 0.20694283133307526 + }, + "copa": { + "acc": 0.77, + "acc_stderr": 0.042295258468165065 + }, + "hellaswag": { + "acc": 0.4749053973312089, + "acc_stderr": 0.004983492928102842, + "acc_norm": 0.6303525194184425, + "acc_norm_stderr": 0.004817227292240292 + }, + "rte": { + "acc": 0.5126353790613718, + "acc_stderr": 0.030086851767188564 + }, + "winogrande": { + "acc": 0.5951065509076559, + "acc_stderr": 0.013795927003124934 + }, + "storycloze_2016": { + "acc": 0.7268840192410476, + "acc_stderr": 0.010303512765124683 + }, + "boolq": { + "acc": 0.6284403669724771, + "acc_stderr": 0.008451598145076598 + }, + "arc_easy": { + "acc": 0.6321548821548821, + "acc_stderr": 0.009894923464455191, + "acc_norm": 0.6077441077441077, + "acc_norm_stderr": 0.010018744689650043 + }, + "arc_challenge": { + "acc": 0.3037542662116041, + "acc_stderr": 0.013438909184778759, + "acc_norm": 0.3267918088737201, + "acc_norm_stderr": 0.013706665975587338 + }, + "sciq": { + "acc": 0.911, + "acc_stderr": 0.009008893392651523, + "acc_norm": 0.891, + "acc_norm_stderr": 0.009859828407037186 + }, + "piqa": { + "acc": 0.7535364526659413, + "acc_stderr": 0.010054810789671824, + "acc_norm": 0.7665941240478781, + "acc_norm_stderr": 0.009869247889520998 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b28bc4seed2/evaluation/rankeval/4b284b28bc4seed2_4_lm-eval_global_step80108_2023-02-15-11-04-05_4shots_backup.json b/4b284b28bc4seed2/evaluation/rankeval/4b284b28bc4seed2_4_lm-eval_global_step80108_2023-02-15-11-04-05_4shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..a495c3d7cb4be80b0fbf74f463206b96398d1c97 --- /dev/null +++ b/4b284b28bc4seed2/evaluation/rankeval/4b284b28bc4seed2_4_lm-eval_global_step80108_2023-02-15-11-04-05_4shots_backup.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.325, + "acc_stderr": 0.014818724459095526 + }, + "anli_r2": { + "acc": 0.335, + "acc_stderr": 0.014933117490932577 + }, + "anli_r3": { + "acc": 0.3383333333333333, + "acc_stderr": 0.013664144006618268 + }, + "cb": { + "acc": 0.21428571428571427, + "acc_stderr": 0.055328333517248834, + "f1": 0.20694283133307526 + }, + "copa": { + "acc": 0.77, + "acc_stderr": 0.042295258468165065 + }, + "hellaswag": { + "acc": 0.4749053973312089, + "acc_stderr": 0.004983492928102842, + "acc_norm": 0.6303525194184425, + "acc_norm_stderr": 0.004817227292240292 + }, + "rte": { + "acc": 0.5126353790613718, + "acc_stderr": 0.030086851767188564 + }, + "winogrande": { + "acc": 0.5951065509076559, + "acc_stderr": 0.013795927003124934 + }, + "storycloze_2016": { + "acc": 0.7268840192410476, + "acc_stderr": 0.010303512765124683 + }, + "boolq": { + "acc": 0.6284403669724771, + "acc_stderr": 0.008451598145076598 + }, + "arc_easy": { + "acc": 0.6321548821548821, + "acc_stderr": 0.009894923464455191, + "acc_norm": 0.6077441077441077, + "acc_norm_stderr": 0.010018744689650043 + }, + "arc_challenge": { + "acc": 0.3037542662116041, + "acc_stderr": 0.013438909184778759, + "acc_norm": 0.3267918088737201, + "acc_norm_stderr": 0.013706665975587338 + }, + "sciq": { + "acc": 0.911, + "acc_stderr": 0.009008893392651523, + "acc_norm": 0.891, + "acc_norm_stderr": 0.009859828407037186 + }, + "piqa": { + "acc": 0.7535364526659413, + "acc_stderr": 0.010054810789671824, + "acc_norm": 0.7665941240478781, + "acc_norm_stderr": 0.009869247889520998 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b28bc4seed2/evaluation/rankeval/4b284b28bc4seed2_5.json b/4b284b28bc4seed2/evaluation/rankeval/4b284b28bc4seed2_5.json new file mode 100644 index 0000000000000000000000000000000000000000..c743f194a5a743a7ac9262648a36853868505f57 --- /dev/null +++ b/4b284b28bc4seed2/evaluation/rankeval/4b284b28bc4seed2_5.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.33, + "acc_stderr": 0.014876872027456729 + }, + "anli_r2": { + "acc": 0.329, + "acc_stderr": 0.014865395385928355 + }, + "anli_r3": { + "acc": 0.33166666666666667, + "acc_stderr": 0.013596836729485171 + }, + "cb": { + "acc": 0.19642857142857142, + "acc_stderr": 0.05357142857142859, + "f1": 0.19293024227234748 + }, + "copa": { + "acc": 0.76, + "acc_stderr": 0.04292346959909283 + }, + "hellaswag": { + "acc": 0.4727145986855208, + "acc_stderr": 0.004982346155911131, + "acc_norm": 0.6357299342760406, + "acc_norm_stderr": 0.0048024139199326545 + }, + "rte": { + "acc": 0.5379061371841155, + "acc_stderr": 0.030009848912529113 + }, + "winogrande": { + "acc": 0.5974743488555643, + "acc_stderr": 0.013782866831703044 + }, + "storycloze_2016": { + "acc": 0.7231427044361304, + "acc_stderr": 0.01034711289027693 + }, + "boolq": { + "acc": 0.6321100917431193, + "acc_stderr": 0.008434276591093021 + }, + "arc_easy": { + "acc": 0.6325757575757576, + "acc_stderr": 0.009892552616211555, + "acc_norm": 0.617003367003367, + "acc_norm_stderr": 0.00997492038453649 + }, + "arc_challenge": { + "acc": 0.32337883959044367, + "acc_stderr": 0.013669421630012129, + "acc_norm": 0.3199658703071672, + "acc_norm_stderr": 0.013631345807016195 + }, + "sciq": { + "acc": 0.91, + "acc_stderr": 0.009054390204866439, + "acc_norm": 0.898, + "acc_norm_stderr": 0.009575368801653873 + }, + "piqa": { + "acc": 0.7453754080522307, + "acc_stderr": 0.010164432237060489, + "acc_norm": 0.7633297062023939, + "acc_norm_stderr": 0.009916841655042809 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b28bc4seed2/evaluation/rankeval/4b284b28bc4seed2_5_lm-eval_global_step80108_2023-02-15-11-04-05_5shots_backup.json b/4b284b28bc4seed2/evaluation/rankeval/4b284b28bc4seed2_5_lm-eval_global_step80108_2023-02-15-11-04-05_5shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..c743f194a5a743a7ac9262648a36853868505f57 --- /dev/null +++ b/4b284b28bc4seed2/evaluation/rankeval/4b284b28bc4seed2_5_lm-eval_global_step80108_2023-02-15-11-04-05_5shots_backup.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.33, + "acc_stderr": 0.014876872027456729 + }, + "anli_r2": { + "acc": 0.329, + "acc_stderr": 0.014865395385928355 + }, + "anli_r3": { + "acc": 0.33166666666666667, + "acc_stderr": 0.013596836729485171 + }, + "cb": { + "acc": 0.19642857142857142, + "acc_stderr": 0.05357142857142859, + "f1": 0.19293024227234748 + }, + "copa": { + "acc": 0.76, + "acc_stderr": 0.04292346959909283 + }, + "hellaswag": { + "acc": 0.4727145986855208, + "acc_stderr": 0.004982346155911131, + "acc_norm": 0.6357299342760406, + "acc_norm_stderr": 0.0048024139199326545 + }, + "rte": { + "acc": 0.5379061371841155, + "acc_stderr": 0.030009848912529113 + }, + "winogrande": { + "acc": 0.5974743488555643, + "acc_stderr": 0.013782866831703044 + }, + "storycloze_2016": { + "acc": 0.7231427044361304, + "acc_stderr": 0.01034711289027693 + }, + "boolq": { + "acc": 0.6321100917431193, + "acc_stderr": 0.008434276591093021 + }, + "arc_easy": { + "acc": 0.6325757575757576, + "acc_stderr": 0.009892552616211555, + "acc_norm": 0.617003367003367, + "acc_norm_stderr": 0.00997492038453649 + }, + "arc_challenge": { + "acc": 0.32337883959044367, + "acc_stderr": 0.013669421630012129, + "acc_norm": 0.3199658703071672, + "acc_norm_stderr": 0.013631345807016195 + }, + "sciq": { + "acc": 0.91, + "acc_stderr": 0.009054390204866439, + "acc_norm": 0.898, + "acc_norm_stderr": 0.009575368801653873 + }, + "piqa": { + "acc": 0.7453754080522307, + "acc_stderr": 0.010164432237060489, + "acc_norm": 0.7633297062023939, + "acc_norm_stderr": 0.009916841655042809 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c697184528aa962bf54a0c83032b69160d55ddf7 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:12cfa5fc715dc7c8508d271c80e45632c4248be6ae83fa3f393566dc799f11ec +size 199058647 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b747fe616365960c76c3ceb8658b3804bfe55718 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0411ab11df68459ccab0fde44db543c628d472b63952716d8884914d845e4ef9 +size 199058647 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a612e728815e2a3bc14e7af6a316065edff273c2 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77539b2005757dca4abdf6a49a74afb27684852a9c10da2dee5a5546d7f11b55 +size 199058733 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..776d144e9378d3acd494cf5a36e901e3ac6fd586 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a2429507947e50f16956746978608e3b95163e93dd7117935c47bcb80d248966 +size 199058733 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ec3ccefc9ad85fce198599e9657f7f38e9d80906 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ea2cbdfee5cd99c974b9f298f6a7b0606c52a8b46f8f053d8034ec7cc0ad637 +size 199058797 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..49790c0860cb34c097751e9a399db0d64066365d --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9dc9e431ed051eb298bf10fd166b8d885ac49da6d97a5b64c02fad71716aed2 +size 199058797 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..452823cb001024433fded77dc2f688aa0855dfe6 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:293ea88b37bb6769c87497b0993477fe01380b889f7449141cb0b0b68accf0db +size 199058733 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fc40961003e87342fb2ef4413ecd95160bce180f --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d232c095d18594db3f64c02c76b45401ce54da01389d984e073f7af4715bc72 +size 199058733 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..38f99748d6eb6d6fe3d9848486bbc68ae0f5039b --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf1f8274c36b9d1269a4594b4c1f4a769f988098e5e9de0e3763c391184844df +size 199058733 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..aba112271fb557f8db98aab5237ca00cb62cc8c0 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:115e33d3ff1a2ea69cce4fa1e01c57135b4657c383a5c1024f3057e22bb05766 +size 199058733 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c27a39ff5cbfe8782bbc37982ee1cf2fb3ce312f --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e1a593e9309d0722bf09f54cb123f16f996a5888813895f12408e544944ae1ba +size 199058797 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..985fbb360d7e70118e6ac8936f2b92115f00e1eb --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:65c047b939b3ed46aa47df91798fcec65695ab56f05f6cfd2e28305323a46a70 +size 199058797 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8996fed0ad00fa329201a53a6044f673abd39e9a --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bbae5439900eb8d44166e0f87466b78e4a9944de4f31a4a6ffbbb32eaedaa39b +size 199058733 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..450624589f222898c8238cfe12a2b55a6a1b7db7 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e214ad4a8ba108a8515c31906d6ebfd83ff421e3fba48e2987cdd42f54a1eb19 +size 199058733 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..439d3e6cfa6296b23421af3fefeefc87bc614055 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:013978884dcbe1a2112d4f170169c2ad02b7335ac45dd6a170548ca7ba2ef501 +size 199058669 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3f97d99e6c71e86323da7942457ca5f10cc91219 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cfb7da41a1be3f19ece416c2a36bc14512c988b5c9a4aeb26cb040c69a45ab3b +size 199058669 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cf129e0b6c0017fd6a7dbaef99cb54da4602b6fd --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d2ec9c4fd4cb65f577a8388cfbc9a94ba43c15c66dc34bdd6265395d710156c1 +size 199058797 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..99c6ca2e0d7c45e5352ba5a84aab50e1d09a3e26 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74ac63e19d0eb8b89606369832a951adc4ea8a7282bcc2ef4706217338731613 +size 199058797 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4922f9a909dcc862d222a5b3bcda39bf11e30be9 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d6fb6fce4369bc00f7b551db30a265c78776fd0217d3c3d4a0eae33f1b245e8b +size 199058733 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c2449384b43d279489f311a809c3e1951820e9ce --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a01e8e59159b70ec791616e8eb6fcb293080f965907762d90989007c24b86313 +size 199058733 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fdc5a5e7039cccebf25569b9d491e428a2410dae --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:341896d0d952383702551f6d047b73e667a30533875bd6019fc78e36e3b39555 +size 199058733 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a10d84682bcab4ab47f34a2b51ffb89cd540a353 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6153d2d064e2e6088094c973fe2864cebdd566f1121fafd5cb96760c4b195f02 +size 199058733 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ccfc38233d1a8990b01f9ce50077522cfe45fa68 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2820c1d32f011c43ffc09b83ffa662b6270be5603dc53b15c91830f7badac2bd +size 199058658 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..35a9d4a010cbf48787740aac5395362e3e582c66 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3caef33b9f7ae3415fe45cf8ec45d726659745eaefb9af2d7d902890d1900eea +size 199058658 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a5d71fbfaa902eb9aff4be95ea73721de4227f2d --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e25c40dacb863c7632608000b5ac0e9c7878af11143804dc131f4e4969bb45be +size 199058733 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..28e19cfaeb361d5f87e52a8387dac5adc89f2acd --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51ba3ca3b64850ac4857320e09f22b431d000e98071e5dcf9fe0fa09d9bb910b +size 199058733 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..65623f0e7638525f5b77c6be4705e46262be4f3e --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:95d5255dc54f2d9958a53aa50b755e5a5fb0a978ec7edb873c28fadf26d6bf62 +size 199058797 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7bcdf53243b81bc2e7d48fa9322a67f9326d9b9a --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:17f4fe1cba99ec409e6033e5a55ddc27b64d41583b5569ab08fbad092fe33746 +size 199058797 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..31d0273bcdec9e8d9764c5a819abd0a3b78e1f3b --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec2b5032631187d94d694f7cdea5ce3fda07198318a5d596cfd78bf47e6e126e +size 199058605 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4f2ad0af97da37fe3ea4ca7cc783d5d3fdf57960 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:309db82b85d46276f40b5ab6b51ef1c9044341477c8343c492dfc1521cc152f4 +size 199058605 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6a80e55ede2a9341af863fa589b7c363fec80dcf --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ea6433a99ee147bc46ceee27f8be26f5d01df8e946e9a0cb0c627498d609c8c +size 199058669 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d6d1433fb47c222354097c20936ec5418bc5b959 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7bf45643be6d988c23fbfb7e2fab9ed9fa64a9f932d02dcbb915b54e8ade1528 +size 199058669 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7ed6156e685b856691ff668a87d5bbccd578e06f --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a82dd97223d8a685df7c52b8295aa225af5dde99aede731d380b3d466f407268 +size 199058797 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5244220482f84d93b667d7f303b4b94f57dc189a --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df0ab866c3163075945fca84776aa7d7a0675143ded7b0b08074936282adee52 +size 199058797 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..13d5160e2822268b4913ba9416845595dcc2c562 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5dcec716edec5f2d90486237ec99576005295dd0e67067f2c40f59315d4037e9 +size 199058733 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8a6a44633d6a0e194538ff09ef898c3538eca9a4 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:47cf1658108a2f0ed5ae4409c47e03a4cbcfc3f5c2f91b59789c39d558e5ffee +size 199058733 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..44d28010b2b0613a0dd778ebb1fdd99960a2ea5f --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:36ed45970453b179dfb77d46d8a8343fa620d335f5d6b6183a2b05d4af4060ee +size 199058733 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fba6f860446853c4f6da79fbad1350fb30f8e64e --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08182919f8252e0ec47fdcb9acb754f7e61d67f274b34dc0c97f702f8998b45a +size 199058733 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3f8cdc33ad66dfa40a127ceb21a7cd771dfd252a --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a27342f0ec04f0f27571527d880cecde7edd744a0e04546f6e9642e36a2ae2c4 +size 199058733 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..293f337d8283fa1ba758feb4404471fdf57eb251 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dde0e8591baf3afff60f40151f00d853bd7a2720d6d1956d7b05842d9eb70cc8 +size 199058733 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7a2a1075d759d671e0ed84147d0347342477dc98 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:057f060d55d13003c0f21f11c0d0e7248ec8faace7836f9e9cc1ec0bf0c612cc +size 199058797 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..78d724669ec804345395059ef5a540aec6f24123 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f156990fa9d810b3c83f1cde86fa91f017774f85c2e43a623649eba224dab0a8 +size 199058797 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..148fe594b1dc4d68caba8b1bd8c67b90c5d6382d --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:877749938190bf71bc9baf792ad6f97d6cc26e833987c8bb342847706297930e +size 199058669 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..68cd785d2214575e4113b8ccd2e7c08c3b2c1861 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be9b21f514e453f713303775989b1fe65b551c53e40266478749ea083982c440 +size 199058669 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b222d8e861e2b20decee0fc9d0880921d594ff8c --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d1a421d923a2a882b00191456aec68b741f70d44e50cf2c6daad9c7ef51dae8 +size 199058850 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c3d2fdc50a8d07251ffc0f90a70472660f591177 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:11e1583fc38b977b8b1bb5ce608eb412476df197ce6168a311e8d60fbbdd32b9 +size 199058850 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3e9c37b0d93cc457c4ad6133ccec930150dfe74a --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c9eb075494cfdcec7cc0d36ec0d5c43fe99aa68dc1e00f473fe450886a7bda8a +size 199058669 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9b6557f31f1a79d8a0c3c03235fa9bc5cf3053fc --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7405384bf8e38576e781e2479e6a95162ba1877a22753799ff713b9a42ad044 +size 199058669 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a27723021ccc2e4d7feb248e26d99ed45475781a --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2dab9ad1e8f57939693e79781521c23a4e7c55256283b847efed5fb8c4a87915 +size 199058797 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..26d751905e86294aa0deecc3717512e36fce673d --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2979325a3fc3b97fae6966b6a707f701cdee92dcbd9871e4cf8a77c55fa4c2a6 +size 199058797 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..168dcb85672fe401f1a19e4026553b4269d37364 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:167f80cb4162e680060467c32ff4a939013d54d53001a54afb2f184c54e790d2 +size 199058733 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e411024ecb5e99912f42a93bba4cdb8557192465 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0e423d06b6e556e73866a45b4eeb0af9fc5ae270daaefa60c3bf9b7ca6454ff +size 199058733 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2f20475e52d9fdd793c95e829462ee61d115dbf9 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dfcb19d162d5c65cf7223eb1da7b5b4131e8597eba380f69c10cedf65865ab54 +size 199058733 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3bf9713d9fabc326257101778d8fafba5cf07479 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b90c81bd9ee55c63eaa5801bd89653471fd87ac3a1fdc9669e97c1b13c29b334 +size 199058733 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7160b338fe807c6ea874264513803b7705b2192f --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dfbd5c4efe5ea5dbefe09aad6bd17de2567522aaaaf79ecc0ab942e0bd5b7827 +size 199058669 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6537f76fdf27e7de0ac2bd6eb05eb00cb576738c --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f2e9b6ef600bd85ae5d1c62e1bb900295b4fdccdc34621ced25b56c76d925431 +size 199058669 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d5b643b88ca47e693b8e8f06824b0b41dd252bab --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ca6578ac9643667629175cd443afe3a6ea0bcd12f1554083e86d21a89be3b76 +size 199058925 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..91f1a3e8e53ffcac152cadf27a5ef952e70bb510 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f68e2783805ebcbedb55d42b172ba2215769b9826f4354da1bb82e14449cdbdf +size 199058925 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ab9250705d2651d6269cad933564e7ffe01329bd --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0272fd3de9e94601b153bccea5cfb4849c72e50835c48b0b641d9ca4e734793 +size 199058605 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..896afbfbbb68f34073fa2a89b7f3f9ee51f09bfd --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:caf55fbad014fcf90db459116a16a21dfee63d430d1b1f456375195e19965477 +size 199058605 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..455ad76c3c0be17b5910739878e21528254bcc85 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:022ff4c2faab4cf9acd1c68199e280bc91906876ce1a3e3474645f56084a989c +size 199058605 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c4b34a7001eb572aa5593bfaea91bfafcf12cb90 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de0344f77a9571858b9631fba27a47ab05973b204194458d524366d95d24dfe4 +size 199058605 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d8d6ea3f9af69fe8734a2c41157f909c76ed67e2 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b1cc095c8a79a8de2e77229201f7cfe59f4eae2b912506db48056b045367109c +size 199058722 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dee27d6ce2b567434ae99259dadc7f25a49822c9 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bbc988ff5ae151388cd03642d1ef6d00e3793a028cdcb2ccab873069af49584a +size 199058722 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7726fb96c105370d57b4a309cd84f7d6556651a7 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f95891bf68de1e6d0058d34597b6635d368d99256da934ead3a1204db4f6031a +size 199058658 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f97426bdc3a226936e9923011b395ca2ff489b3b --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ca6126a94e828f8bf1d75dc039dff567aa32b87da5fd0fcc85b3ba568040482 +size 199058658 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5a784ce3edafedc8e7b508ed6bf985ea41f14376 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d71fc356ef2fb5c4bbc7bbb98099ba12eaa392557854754ed160635d92dbb823 +size 199058722 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e8a4cdc72253f40078c098f34dd1261e6f4b0948 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:52e6074769a875cd4c6562efde958719c9b0608aa9d572245aa918863d26f11e +size 199058722 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b03f98fc2a2a4de78606bd76e64c3a58b777a37f --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de6a6a34d80a6de50d5c352a4ae119539dca58ff07d8c12ca06a75f2e84f725d +size 199058658 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a1d213f106831b94705d012cd4927faf6508fa83 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a47d3d43991751012889a3b42d7d6fdcaffa97583e67384940df2956d037e1e0 +size 199058658 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c64171fd69dc6069ef9100c4fe34236d28380936 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3028b07774e7f916da3b8e24448e8848c136aa4767a2270c946b71fdb0366e05 +size 199058786 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a2b91e7e0f1d23b2c47c2c09af51d0d1ef9b4656 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c59900adef68710611dd1b3787cf4875ff6a17861dc06882b159cb4c79a16461 +size 199058786 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5425b0a3ce5b668ed3a66aa36dd8151d029b2b0b --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:829ee3b3afc8af8b666171296e40c0489d13a9486e3162cf7708289a285f48f0 +size 199058658 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ed3863824c38bf2f13715ff3568239385e8f548c --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c075bab962ee11e3d3d3beb2958ce2de80ff37d1fc395c9ed3b2338e6a6fb917 +size 199058658 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..859f39aa3a06e6ee7ed0cdc6b9be639e0d050155 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b9f85a95a0d5a532a031dfacb810197d6d2716da73ddeb79f731a40dc32e6da +size 199058978 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a7bc2df43c788d31fd441a310dd4cd25d8f65ac6 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7638f984c77ecb3af5af751c23037e3cecf7fecb0b60af34f831d850c9dc3adc +size 199058978 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a7fd58d8ec1dd569442dc7993fd17921adc3d1f6 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64e18867443c072826bed8ed44940ce8c4dc0cb4aca8e6e283585826eeffcd84 +size 199058658 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..31147b4b4bc5d12100be09c5d87458b5414c4d58 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9aa6f5134106c1cbf7456d8ddc7b90e33625d4889376698441e46d17c726b0b3 +size 199058658 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ef1faab455ac0006bf1eebc6e507ce1f196da8fe --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f25d655e923fc90b77d489d82efeaea77488e5fb16962e4ca20df6647e58a0e3 +size 199058647 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1217dd634ba8c2fc8f846513a04532ab2b7e63f2 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aadf21ef5fa5167c1a8e2163243a29016282ac0e50d31c7c8e6cf57a9f7c7fbd +size 199058647 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ef9e6e662fab5c72efadb7e6dd135e60cccca7d5 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c14194339a56425ec526f8c3afd0b07a83edd05dae056db31d05e8f930236925 +size 199058658 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..28e606d344abd802fe541529f81147af8e695773 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c7f3da4b13f6305dc58a6a4c8f12dee89573eed8798050099f796758c5a93ca +size 199058658 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8353d8dbf3a42cf8266927618c5b4d5a7048e06f --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:85676415b6953f8a22bfad92f735736f8fce8063d4ac253ca38d872ec75930fe +size 199058722 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..600af14f665c1a1c2549650e016bc6276051e678 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5649e935cec2c952a7acdec8b8f23ac62bdad00a175874ebc7852078355826ae +size 199058722 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ab308efb92a4bc0c2fff44ae8022564f8ed40b96 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fcb73278481b6ec377fcf6e5fa7cfba928a3859f76b41618b324852817591d0c +size 199058658 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9b0d88e7e3956c87754ab7dcdb226cfc28c1d147 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:750e79928692e399a45b4d387bb59058f70869e51d72bb48674cfcec8143356d +size 199058658 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4189e1acb8facf706cfd976873a751a16e5b49af --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:94d920105a75b7b3f6cc81ec261470266e2b02ddda3d7b5145f3ec4b4da55a8d +size 199058786 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0a6fb846e922bea0a71b8088d1bb7629b6b76880 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:75d2d7897d2a8dd89b3a62bb5f6bfcc2d73815ed9ad8a41d10db8a3b78321f05 +size 199058786 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a83416b1c53ff1ab97f0788903374627e34beaa1 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c0d8a7f7b82cb50293b9934acb6fd4e06cdc1bd821f73d18426d1602bff4fa4 +size 199058722 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..80cd4d159f5fbe671f154891f2a177cd3ff82feb --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d646d66296f30ecc6de0939e813145eeba44baf787036687ce9560ad1e0e4de5 +size 199058722 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..79e9f28557161eb187b4cd42fd2aed34c0cb1807 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:38e8c8570b1539e26e5712c6c8c5f26ba1702d991702e10644a1a051c8a9bf1d +size 199058850 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ce8a9e1189395d66fd9357b04d43030f7ac7a127 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9124a7aa8334fffb0f2ea6860dc64bccb4dc4b56dd3c26179887d18c61db8dc8 +size 199058850 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1797d16b092d8bf4930f2dedacd96eff936d3ff5 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d011c16b7b758a3a69173f76c87b2430e022dbb9fb573189ea3b3ac814381e0 +size 199058722 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a373ce925edf0018dd4100e14d52407046d77e4c --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe5515e7d26bda4d242bdfc44ca12de057ce70e917fd220c2b1a3baaf11d7ddf +size 199058722 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b7a629cfeebda35c3e7aef195614f7437d1a527f --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:98056851988d88adb6308833883ec9523c17c6905bc4658a7e5ba33585c1d661 +size 199058722 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..eca41bc2b994bf7d83aef3d9938a763656184f90 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:12ee25931d5bebaf2004487903ef7c5fccb0d1ffc3dc9ca79186f56265940460 +size 199058722 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1646748e65ac8f6c905d77f21cfe3d982b54765a --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d12ad2a59005332198f5f86dccf4f21a61435023b152a16f8fe913d8602c014 +size 199058594 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6da3c3ab79607ecdbd200fde10ebc0647a46e740 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f8c90fcb87c6a4553a343281ef526912d135513a1c882b74c93b458bf949f03 +size 199058594 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4064395a31763a80a62282dddb0379e5600e748b --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:916485c4d77726177023f3d275036a9414283ef275123501527c21929642d48e +size 199058786 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6f8ebc9cc2dc65f9728ea7f7d5529c5cad5dd5b1 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:757a612d299946280c5e976a70825ce163f4ee01c1b7ac77606e21e06096a95f +size 199058786 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..92d0f2a7ea172450c2469d4dd492fd8981309ea9 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d334952a17e1b9144a4b25a40492ba27e4c9b3139c06aa75693aff9de699aba +size 199058711 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e3e310d33409d206c335e53ed4264e599d3a9e31 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1884e616252d4c7637b8bb43891bbe039e2aaedb517ed50a29e80e67559e74dc +size 199058711 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a3f6f9fff82b7c3a08b8be6bba31c3b1ec60a0ba --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:70da02b9b842d3457b29a582fb29d9d9c6308ad8997cb2539e688f8a5fbe42e5 +size 199058722 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ae5a29ea57665207e83fd5b1dd862df1e928da8d --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b04b546437c58733ba6ce93f8777d6e6980fd386f225f53ec2d2f3e8c41dc646 +size 199058722 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a6c835d4e7ce7ec1fd6cbb1ee929f13269ed0e1b --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d1561c58feda09caddab9f90dd26e7fff402a4718397b6d0da2f7d250a5d363 +size 199058722 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8415149214acb059c18d0d1cdcc6be8e83500495 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4be0496d5e2f97ceb063a7a2b215a08ae7c47b26ca68febc36f849e4213c171d +size 199058722 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..55c56913d4c8f344215484e475fabaafd64d3f97 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:713803166fe4b148c13886a0deee8b9ae88f016121845bb1989b1ffa57a9ec66 +size 199058722 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..42245def609fcc5f5ef33ac6c711bb49ea2f43b1 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a9b650de33588c06c5ac8ac3453ebafe0c449a89f7e570cbea9c9e6902e0a0d +size 199058722 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..215a3b28c4a244e04bcee178e159f055ecf3530d --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b9da81c1cc33e6bf00deb44d3de8621c5ad89b7af497e49e0a48bfc9a7b89b8 +size 199058722 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0a38581d4c1795b45a606abaa3ebaf2ef0ad3cac --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd8fc82d675ef78c862dffe8766dce9726cd2f7e3f8662a79b8db63fee6021d7 +size 199058722 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2d9f6a1d2de2cfe081fd3ce4f392a5ae358c7d37 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6981ea6167ff12c6b3eaa39d2b3ad0e3371322992fc3309597078ae17b5bc872 +size 199058722 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0bb1ba6623a591ad94ee5f6326a2fed360fd55d2 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46aace5cf8831943fe6ce2d5957054c2b547b39e0fd62836b29d76454527757c +size 199058722 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cbb0b6b613d16965cc1e10c5885d1901d033c023 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8dca3d7c66bc80d34a3c88420df4114d1d06b9bb5a084b4ef98019fa729c83c1 +size 199058594 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f227ffe2e67f040b45574824d31d94174aea7b7d --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad3f02733d8a0b6632468b1b4718f982eaad524ea929aef26aac3538907db8f3 +size 199058594 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3cee341b4eac089adffbe9a3445568012a8de881 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9873afda7d9633046d6f7192a2354ec4096e43bc7e0d33429e242453bd4a0e52 +size 199058722 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..655eca5fb66c7a3739b69fbdb80663a4ec8a32fa --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:286643b00ca3ee798f56f5623341821e71065255e67765485e607d3f7baf9c20 +size 199058722 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7d3628d9e106bf37943a8c550222f1b56983c08e --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:32b359032453fb99ca269ce99a167af6a294998be149353f7f01af015f4dfb1a +size 199058786 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..067c50e96006aeeff10fb86eab9fb63e2d8bce32 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a3871ea56fb4b5aa4d4688104bafed6abf6ca810d0e47ff3258fa8c96f22de74 +size 199058786 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..321299024018f289f672a273d3c502f622b70b49 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7aa3bd17e836bea8536969b5b8cccc7deedd42312a140fad70b7408362a3eaea +size 199058850 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d28393fd73c50e80d859a43226fd04b59c26a039 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:88582097f51662a9df095495a63268647a4d6cde2b925e519235afdc2687126b +size 199058850 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c473edbe5c8c074be4786c15cc78b2d8f729b2c0 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a2f4b7203b7e15e2e790fb30ccf61deb9581bd2edcc3f08e9629e341571e5b6 +size 199058658 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6edf16516a2540b1eec1e225f907f27c7f2c47c7 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:118673f0a39de59bd6382f0a7c2eefd83f9b60b74a7df52868af0e7165764685 +size 199058658 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..014df94f11ebb37ce3f4261bf5906ab0bc242882 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f2c4ba164af2af70dc4c227746dcaff74a19e5296d76674ad5908f13c79932fa +size 199058647 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b940842e076607cb7babd76dc1a4ca40cc71dd3d --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:59b296ad439f6cd75b88575ba0a342e092cd4c87c793d867ba19baa1c14d3757 +size 199058647 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e111cb8c450ce8039ad006b0f2ac808473da8a59 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ef0efa4c1f89034f2e3d96f2ad597b5c39483816cc8034be559f4da508421f4 +size 199058722 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d9ce32d94f57743d8b013c2809f2da4665d9aaaf --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3fe2e53d9415eabb549acb161bbbd88ff6d17c03009139ed784445f7fed4be15 +size 199058722 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8ed7934720c04d8016c993be1151244f3781547c --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0cca7ccc91b4307c4615da6d6a7da702c5cbb6c925874d7cb1eb81d616a9b564 +size 199058658 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e187a1dd831de3d6fb3a6c4cbb73210b39cd9fa1 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2446ba56a2658001e2a8217e60486e2c5f99e340ca2fe60db69f6abb796119a3 +size 199058658 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..70e455ad72fc842854a88a304dbc47188f8a17e5 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d1513048031f74a2de3bfe52d54f1d0075539539671a7fe0556854eebf93725 +size 199058658 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..23761ad39be7aeb1875383a8146a4450aaeb0d14 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a09cce6b5f9508baf3b93ef25fa943fff19041dc8ea9276526b279601592878f +size 199058658 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9fdc6cb0bdbac8a991e99ed388bca17e419343cb --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0be5c7e97b75562b28e4721472d45b1ca6ba61c17fb5ed1e2416106d8b94dc65 +size 199058722 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2816ba77663196cb0b8fa0de2f03729a35d5b60e --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa21147d8e71da3485d34567a219688344d2810849ea82129614c57f390e9d3a +size 199058722 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d1b082f3c2fd3a658a6649c975e609a1ea3c2b14 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:344ec5c5891cbe5df39e69a1138df24b417a588ae2d2bd543b8965d702d699ba +size 199058850 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3c4cdd178fb159fb7d85f1b990e5d0ed33721ef3 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4210a6e6c571c5eef13d30dd4d536d297149d4b1dba31ee83d3367502fc43cf1 +size 199058850 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6c968f902e8819fa28b840889d047b2f54e78b0f --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:89d7cf6ea2dc94719e582a353b107dc0b518da9deb5fdcab484f5d0ce9d79b96 +size 199058722 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7c3056eb1603762180bb8cadae9dde30a07481dc --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd79e95883d84f8c422f1997e7a88a23a5b045f42371ffcfcef8933d6a586d65 +size 199058722 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..55263f9e4151c39744e070b7e726e8387c414d31 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:72be33982067569ab18f46f83033ae0340aefbf73d98b8f50646e02ad98b025c +size 199058658 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..23e49af5dc231407c5334008dbcf9809ecf1f9ce --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:78969ec11a556eaac31dce1efaafddbd2d2f5c1d7ad0a75d315a7c03d8e6a04a +size 199058658 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..717ceb9f8bc8b03c304894665039633483a6abef --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b923de12c9536676f3114825ad0d17b3ae7fd9c742d81ef756dbbf56f1a6c562 +size 199058722 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..61b12ce0630a21c1574248f5b7d8c30bf4bbc205 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:94ef65dbca5246b4c49c4cb627df827772953a9cbf6ef7fa8897dc7b5b6f5e18 +size 199058722 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..83aade486ab81c03b7dc32cf9cb8ae10ce23a86e --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d65f1b39088c38a71d7d49fe3db7efdf707f5b4cf5a7fb4fcb04152420e6400 +size 199058658 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..86a4cd624f08e86c30d464de790c913300f6d1c6 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d01191eb4593b827f69cd41bd2ac9344b53faa953ce728389dccc1d6756fca36 +size 199058658 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f7e7862a6e0a92aeae4f53283e16f572cc5eb78e --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8cbb30ed359a14fedb37022970d46e6d3c417876c6f4be3b9bd1f73a24c59227 +size 199058658 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8c94ff677a292f4336c328380da3d53b61c40dc8 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab5e016fbd082253a20deef390f84322f003699c9464ad1c9ad336e5caeffa17 +size 199058658 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9cbf5f42224258f753032f1c2b79630149ccd9b4 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b0aa9468b1a76fae5835c34fc4d716d4be33504f3b318929482ab3808c8df3f8 +size 199058775 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fd7c213882c8f9ac6bf176ce93457657585fde98 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:849c672dfcb243447f45062e73ed3fc99212beea6378c2cf1cf683b4632e461d +size 199058775 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2085f7b1ccf9c4cede55ad741352d7aeef861850 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34ae4cac8fd6a2609a6756763a0c0048a75b33e1cb9aedf9da369a1c3217452d +size 199058722 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..af3e5fa923baad16e7739970d456b1843373102d --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fadb2097d4741deb876d4d2b5b9035ae8936c8410458b32c087a3f6f2e0931f3 +size 199058722 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..06399ffa7f8122b2303f1459e3c9540d42daf804 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8346cf4a39a0ef5a80bb81d772ad9d9ca5f6d01968e97d90ebbc2cb264a28847 +size 199058850 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0baad4c26a2313dfaaf46217eae39468958fa43c --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f2db993f174130c08f9dba1f8a8cec828861723423e884c74abb0aef4ec82622 +size 199058850 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7ccfd9793bdb730bdca06c0397a0b79c6da18faa --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:81904455cb2d7a2a9bcef247a70f9a115ab42efeaba7ec1e852e48ba6c840b1a +size 199058722 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7a2e28a20e597bde7a1854731d87e06495184080 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e284ee13b6a05684b2fdeb2e9d2ae9f49d9566756d0f5b8687f296e9db694aed +size 199058722 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8f5967ecfb2dca2b54526f1a6ee1aac381eebc80 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:45d634e0472d2ce8528ed120cc82763931d5655cdcea5a44601313ab6ffe62ef +size 199058722 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..63b7caafc56afdfdeee1b9868ba7332e4a5f7291 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:18db70bd442fd01ddeca0fead9bf4b49f05b372e3adad5ab0d382ebaf0ef1144 +size 199058722 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..70ef918a98da9a36b2578d8238b790a41fa3e2fa --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6da639cff437cf32eb72367393f4c140ed2e9fd191bdf1ca9c6c1a43e89062b7 +size 199058722 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c4e71c48a7e2aaa33546643a921b13598284e844 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77b9340a972ebba92cf319b29c61271403830be764e69cfd5e69e469d4efced1 +size 199058722 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..782f99182b80419947f3f2af822ae444a5fcbe93 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac869d5578baf9c6e898b3843bcfab0a7b8a9b26dd28518c8c2be48f09c0b9c4 +size 199058658 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9ecac93ae49ca9f881edaea019468e34fc9e0ec7 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0df5e2b566bcc2eabfc1447b75ffff25e299142638f2b39cac40166234299bd0 +size 199058658 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9572996e455682c8d58724342a54d2e596fa0356 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5143fc830a9879027153da6c9faf39d3efeb42f408f5cbbf3e08ee2a49fa110f +size 199058722 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6dccc0748871a125d72d638f5655d0572f1cf726 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d73d21dfaa90e5adcc678f7680464fdc48ded5595fe7c444e5677500a4244da8 +size 199058722 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f8428d8224d2d4fc0ad222695d7057b98a60c82d --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:629b8083346f249ada114c800b1b8f51e3aacb0b65a355628f497f34f551b46c +size 199058658 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d6a39696fc513233702f7e1d7f897c56699f4786 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:52da06ee222f1957236a0714da79799ee09d371d775eb7dd3ceed42452f61fb0 +size 199058658 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4b0f10a0894912b6a5ea4a92204df4cca08b4704 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f577cd3ead6e8cda6727dbd73410fab6a594c2fccbabfbf00cc506bd8384758 +size 199058914 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9677b4367f8cac6a039b4b1836d11882430f5f1c --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce716df35651d93f2823a4ec5e27ae8b54f3ff5329c73a4cff38289ae9a20761 +size 199058914 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..57d92f09761fb372a851987c12011c57a5b21409 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d6de10fb50173ee0ac151277077f807a6ed2e2c27934414f10ae386be81b6ad +size 199058658 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9b4129947dca38ece2b115f1060aa20f75716ba5 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:899d742af26c13ba28fd6996e0dc2fb70553eecd4f81e42feeea268c02182da8 +size 199058658 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..47da92683db7428e268c0764ed4bd5a99b0e64f4 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6bdf8b9a84370105280aa733ef437edf58d55ee96f8ebee6f54febc9d98649e7 +size 199058711 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a0695bfdc8c9abafceaf568a482493c81a561266 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:366af052f1f44c55dbaa966c565429b8f36574635363081b9eca241a94ae3ded +size 199058711 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3666a7fef19512d13029f422ef9fbe1455a0fac0 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:803fd54ac9005133f93de2c5bb07d7418fb8bbfafeaeac42a8da7fb0c06e32da +size 199058722 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..08b923920db02050811b032db6e89f70aa3478ec --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:52b51e40729134e8359a46c0f6186ea0c73f486bc43258cad0228af5d77254d2 +size 199058722 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5d932a5429ab5a2d9ec337773f733dd8937b8ff1 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a4b02e9a10e3eac0a3e97a83d7bcc3a893aeec31eda16cdc5d66bdcd03387ca +size 199058722 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..db83daf6ac9299bb7bb80a4073f2c4d2733fdf80 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:16bc64d36070b76c688c6241ad3c12faac9181fc75b3aef0bc68965011052fdb +size 199058722 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d9ec9fec53ab7cfbe01eac7206ec8cb158025ea5 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a1451c9e0b40fb7a22b66bcec1f00373b1608e920f6b8d40124d3bf5cc2652d +size 199058722 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d654552cb58bfcd85d1a3b2d9d835d39bc355e25 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f37d001a80a336885297006edb1eb92a693352e68246f6a9f7c46d9099be1ba3 +size 199058722 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ef280b7d12bef73e8b53ddc0e5ac098fc8b026fb --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0752b911a79687644313cd62f042a35e607e1bb08df7de9ca2425053d0519d6f +size 199058658 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..77cb883b817f520ba78b665e2a8eabcc89491d33 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:141148497a22c1967cd75799c97e5e4c3a24a09d03fe65d601a819039b498193 +size 199058658 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fd28caf605a235f7fc2da63ae22fdde93540ee71 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa1ceca1f86f425372d6945b55614622227b24eb700e7cae8d0a660d304d7ee9 +size 199058658 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..448edd685c00aa892be94ce8a12fb5a4bea5a6db --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f1cebd50b3254b16a97af76c94d62ecaca4fc5d090bcfb866aa20f799d94d53b +size 199058658 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..da25ac6f131de8df645a0c9c7ca2b90c539e2eaa --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c7f5c929c5ee2f5c2a259bfaea09b007f48626f68bf05d1026c829f29f89c9c +size 199058850 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..73748ededc60bd1161cf34aef3219570588d4065 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c4c5e952960ffd9d4f34960606d7d139130fc319d93668161c12d1a5fe97afd0 +size 199058850 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b074efba26139d41e1916f2d94a23a04acc00907 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d90410f410c947441bfce4bc461e51dfa4027592a032527057bafe9f15b077b4 +size 199058722 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ea1f17d9785f51c183c888d08b7003ec76d14b96 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2e405e56ffbb32f8f8fdc422a4769877e84f53eaa2973e3d2b92d7c1bdfc982 +size 199058722 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0f00a5abe21038a88aeaeda7e6b25ec2d099b6c0 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:66e11b04d45be9df38f9adc7cc4a8be63d6e0e3e82805ec0fdaa791bbd7da379 +size 199058786 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..38b4d21cef62d8d5136855c73545664546dd16c1 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:54fc9197bfe01a75bc93e5cc71f5bb01fb733827e94556323a77d916fc53e582 +size 199058786 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e81342cda879f8131d382e0305072868ef42f5cb --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84c2e7f403d8d9932efc95123ac13d407a13980f9c4d0603ac674428fbe2600c +size 199058658 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..179025cc6e76ced3910682f989009c6e10cf8ae4 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4fdb5b49f93918c81c2dabe921d0025a00974e4b5467ef0a37cf1bcd17491980 +size 199058658 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..02e19d423c9cef75616b960c094996dbdd0fc517 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:43fb68d7897086e80b39069124d765b13e06e824339d9e7077968d65503fbbb8 +size 199058722 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ea12ca0bddcc942d38c86d2bf6244d8fd899fdbe --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e4e01f7aba34867af261547dde34cbff50e04e8711a84cbe6ce121c393cc7a1a +size 199058722 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..20585bbbe6f279f2ed52cc9d70d697e79c6bb411 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e2f475ca3fa9bbfde7cfe400801f5bfc505114f20ca927ad03fc760f8d7505c +size 199058647 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..16f79d833d2e16ac499572254d2307228cd304bb --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0044e5cf0b282f57715f1dd80960d2950d0e6b1a12709ca61e5cfda26ed42d19 +size 199058647 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6462a85cdcefefad8896ed8481e80d92a59c4384 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f62731b6485134e1bbb621e38516d1c3cd65b9c6e8b736250f6102fa33bd812 +size 199058658 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ed8c527748fc693fb732544123eb5a180b6f39f5 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a6fb8715f516ea138ac2ccbe3f59d24eb08e157b341b74250658d56ec244c2ef +size 199058658 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9babce82b4e8025e493f4d5a0f80352b268a1cad --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a97ccae73d1d46bab5d61ba9939d038e00936732ac864840aef02e6e5cfc42ac +size 199058722 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..847a121b9eef4660bad27340e3065f6077cd4cd8 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02d1ca6ca0a6c18404991fcb316e3ab21519036437acceaee97906818fe845e9 +size 199058722 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..01da4bd800897f9d6c1d8a74108c8cf820057a2a --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:47812bf1ee623074e6698d0259c664bfcc207ce74d8ebcfcfcc2b35d5724b4f4 +size 199058786 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3312f61e7b695f2c27785cd27223f5fd2114bc3a --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c422c2fa31d1b1e163b69462db609a66c0a2ea5e870c1aa54a9ebd4b6885cc3 +size 199058786 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dc9c30796bf36416a6392d4e7fcc25a25b54ad12 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58a22e0d2ce93d86aba36693e2c4ddfbd0604ca014a4cd32d31d7ee0e4a95aab +size 199058722 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8a81aea14ba9473a8ac9784b6288b5fdbd5cded0 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b316a1ddf2ffda248f73f76542a0b5bc3c1883a0c17b25ecec7b476fc932924 +size 199058722 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9143074aa60299cbd0b0037cb6a1d23ae1628225 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f4eea2691066ca6b9f3474a7905391f1e40315bd1237f9ec3bb1d0728b74cab5 +size 199058786 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6d474b8f37c97c266196b4c052ebd7312d52a835 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:53d39388a4978e8acc7d4c9d8f4ea1a3a853d10ebf5a995adcd45a39d217a14c +size 199058786 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..26c1caa1705e928438befd0342969b9fab782a74 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cab376031e6dbbf0da7d89ac66503b2a4550f52ce90e5881772f8c10b2469c0c +size 199058658 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e45a6696290fe883bed3d96ad9de2be5b39632de --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a883e6353c4dfb56d0f7bfd6598b9f2eb8bfab0f80550b813cfe58848ab19460 +size 199058658 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1d32670923ece65f13d58629801bcc0fa4db9cc0 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac1630745ea3a44387f4e123a1a6e6133256ed47b67fafd8d06d2b9d911bfc7f +size 199058786 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e7007151cc78fd2251ac3fec26adb938de2cac09 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5a48c19dfff040bf8d5459a0fb14d5826f79098f71de18f86118b36f5860833 +size 199058786 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..08fec6042e0c780a08d6225e40e44ed7c6e951a1 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:05615995e6eb2b640773ec37bc89d97af1ce4787fb4d387465e71db726cef4ce +size 199058658 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..218e02372dd643f46926eeaa15c0a78ecf5d7ab4 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b84ed76c4570d55ba5da87fb940c8ce1fd3ae5dd8206832878b0a3129cd7d89 +size 199058658 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d39eab963dd7452072158f1a7d55927eb0faf211 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:66903d3e1ac00ad4186d077d24c7236b7f29abc1d47fd5ffbfbc8b8373113fab +size 199058786 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0a295d3b79f21d277caf5c6e980e30de50160155 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b0dcb7bae257de1db367eb3c74b69cbdbe2a4fc258726c6e7fccaddfcf536b61 +size 199058786 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e9d14f1bca6e306da2f109d9b02e860c871f4900 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3adfd0574beecddca5e2e3d66e199d269e8cbb01506d65616616a2a0ee0782b8 +size 199058786 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..92dd6cdd3dc80be121d6e3d1b283945eb7c9d322 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b91566fd9d08f61f3a197d06b846304e0f8f9ff1f5556ffaf490a410afaa2336 +size 199058786 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7f5182c4979d8710e33de3b4107c0c6526eec0e1 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ef0e4f3f5a1181a07f17dba9cfc4ec84e92ecb57e377d993e7e3a2c06e04e44 +size 199058647 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bb4b19fd9010c3e96bac01337c18257589b4054a --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b50f2a908f809fb068559081d8438231e8d68878b649cfafa6afd8b934a684f2 +size 199058647 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c895b35920ab72012571f17401def09bb228cb4f --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b46f5539dbff07b75938200d1c69e4bfb23dbecb83ea420580e2289d019b6f5 +size 199058722 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bea034563031e640b138596177ed6add0b707278 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d045f8ea0df55e25157600224892839a96d4681e2d84e796a8060d9ef889421d +size 199058722 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cd133bd5fa0d439c14458b8568424c68bda8b962 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:49a36d8c6ceac3b5fadb16ad0bff8c60304c723e31edfa908d2f7951f9853f49 +size 199058722 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b7071101ebc2ad5b0a498ec8f75c71e5af69bf85 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:257b95c52e546ce3c3cf644ceda96f67506df8983b98387ba5c166a6537ba6ba +size 199058722 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c22485a3014f9c90979909be147c3ee046e4b6f0 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:efec1c9cdb44399dc9285e5071612d55afdd0eff7332c3312179ee7c34258b8c +size 199058658 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2b5c980fe64bc2a966ce45cf0df5954ea70bd5af --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d85c5d2b63024763d491d1bb4867c08e152ca53c1b9a806726f4511809ec5f3 +size 199058658 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c5ba101ee7f206aa2544c7dcb5ab0f0d36c4cabe --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c712e4c1576cbee364c7494f9d140d9547f6d34a8f8e41dbe46d406d8b992221 +size 199058786 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2a96b856fe16cab3d8ab02cd2a67158093dbd904 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5443e0a1ba7b1f0e038261fbb3ed222e7180f920ffea038efb719e2054cb5620 +size 199058786 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cec83d422b98bf6aab684c0ade164990a2d3d191 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:01bdf3b50b128bc5c7738d4c38a71f26dae03d7b579b76e4b95c9ac1441e9d10 +size 199058658 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..73ff3fb23d820b5c26dabc6911931306be8d163f --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:91c37ef6151a2573dacc666dbdc3acc458086969634c8082de053f53236c92c6 +size 199058658 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a085ab55502715b62ff34483bf6b1f784b4a5ee8 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:24f3425c06a3c947151ed95da24efe50292ddc9037156aa7f17d376ca2464f50 +size 199058786 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4dff1ef560d060d459a0ea79811c310233d93a73 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fbbd6a314c3207dedfd0b07f8501e6b6fa4372d581565e084d1b81ccc657bea7 +size 199058786 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b74171fa4b1962fcf27ca4228021254197ac8306 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ad458c1fd92f2837e1f4de8f6977613d86641266016ae9365fd5ba2d798ec6a +size 199058786 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..66b500f4b6068c2c7ec24a534604652b2afbc26f --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d21430be5e3632855b426edf4fa138481cddf70e8ce14b5d657c3f9548830e31 +size 199058786 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1ed8cd7139603c1f091fddee6d98a1f735d5d094 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4570c14da5d2cf2bf1f8badee480ddabfd31f5aed3902ed13ef7c4d3c5544db4 +size 199058722 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9c11091208aebad3d282abcf71b5d13b76a6efec --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9db61ae2479677e24e20b73d3572fcf7672445a27e2daac79838f9562ad02b70 +size 199058722 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f7a961e93e854925bcd5a4ca584067edd50bcb7c --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a30ea270b0c5704d73fe4b447fe1ee13a8d3651367f69053ca6b01a2527d1606 +size 199058658 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e1616440b06e1b834b07e118b33e0bd18a9c656c --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:301357af114a0ad87c130ba4b3c89826b63e96aa2730f1eb3e9c6e668287ff8f +size 199058658 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a1b635f876b3bc5b2eff26e21b13f9a4a3a42634 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb569b50ee3214f2babb7a6e312af35bf48338bf484d7095bdf93a7cb285130a +size 199058658 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..48622f58a1154f66720979c58c3d92bf80315291 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c7f428a49c977a5f1de37c3f330d104c986805d80bf6bb680a0a762587fb803 +size 199058658 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6019088eeeb488767da62cd7cf052f213b1b0c16 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9bc854aeaa28a9b2d17414eb71254ebbf32f0f2e40ac74873db372d94013ede0 +size 199058647 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..49485eb6049c14214f2a6376b6dfc62fd2f6af69 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5412fd0d029f8c6363b8b63a7afea4d70988a30dd50fcceb4b34c4642f7fdf7 +size 199058647 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6ca9cd3eb07ac9296aae17f1d73a4e6926fc06df --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1266b4d0b414e4f2337f1fe5e0b2a92ac6a7301a406ed28579990ab514be9d5 +size 199058850 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..56b2b3463d78b6b34d6f33fd14e7d03d600b4d5b --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e11eb4c0e6dc833739fbcf42d86b8cc3e97d0c5ace9518d8bafebb3871db7b18 +size 199058850 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e233d4b0ae34264104b5e6b1a92f2526a3b387aa --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c540ae417a59ae81954895c53a79fa66074e9d024d3f1718c492e106a08835f9 +size 199058722 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..71a0194f7dad736212457c8e8f00fa4a036fa01d --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08a60005db5ab43f1a2150b8f7288b97f0c605b17ddce3c9da5084b545e640b4 +size 199058722 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3fa2b1cf937efda2d77321ce278e2b529e57e962 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:30f92b51605205b5fb3d5f83c2796c8622fba08c9e7b90d60df7ebe6ea08be1a +size 199058658 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e86497d69b33bf7dd2f8f4f8ca75ad5ce5e2d742 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c47392e7599ad0714784ef0884262dff470d474193c4a034262f6bfe4a7d9d42 +size 199058658 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..537e2bf30532d357da26127cbf3f01c9b2f13369 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:254dd7b126cb5a05b0e1767f84e1a906ef5c70b3ce59767f3fd6ff909a2878e7 +size 199058786 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6c0881976a68ef0801bac7d0813fee82d941b0a1 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2bb261d48a7d41d0337e2dfe526edb38d7c046f3ae2a65f4a011788371945955 +size 199058786 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0240de90de1436158a2676eca6c6de1aeedd69e4 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6fbf811ca6426fee1641f1a1456b57affc775bead927f1f59312710ca640d5ac +size 199058722 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..42d9eced706df409680f0df396fd070c962e1d6f --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a2777c9b7be4a456931dc6ffe99aee4c2b02f34ae8312c6c037c0486541758a +size 199058722 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..04bdb5ee2bb23d6bdc77b821fd85a37d277efd34 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:53b8c282edc4c2c29b9665999ebba2b1824cbe50a844b9f390489d8c7954716b +size 199058722 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..031b28ace51af3ce2cfab5c08a651d2a5629390f --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:12d5c66c6ab0ad12904bba91f4330af8f1c17561d98bbb9432989968bc7afa22 +size 199058722 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fad284adc8a7d6853f5373e11d28117848abf1b5 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:09efac9d0c3873456bbe63b802517cf931e80c7bf197698f8c8ad57c0a903bc1 +size 199058722 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ccaf63db9ea198c69777b50fcd6d86de6d756c7b --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51b843523e0b0111e58d1a3dcc502fbff8f1db37c67e42ed7b50d6d6cfe6ebf2 +size 199058722 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..15425985611dc0dd4f62a5b997d8011087659826 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1bfed46084f2d12d816ee6a3b1f9fb03305b75ddec10df29f0093375157f7f4 +size 199058786 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dca044a19b4a53fb7e222f94b35247da33d00c05 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:131d5770dec30eff5ef258394a585454c437752990cb1a647a1ac1c66c477399 +size 199058786 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1a7f860bd23ca07c2c64ddba610aa602e5f9dc4f --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97abff93bf3be90f9a6b16ee58a4fa62ad15302875827907ef2f1fd98651f18a +size 199058658 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..180ac9a07b2d4afeb14a98191503591a38137b39 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c837ee0bb70569d1a16503f67542f842ba5f5fe1c87150e1ecf87ce19a89bc32 +size 199058658 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e4ebf8455f1ef07c9596360d81822f8a2633b133 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:96a45f98bc9e381d03abe456ce313cd254efd404660eb8db76f35b10f225e128 +size 199058658 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..274afb3df65f40e1e78419c00c398433755da306 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ea3306d2b3b33caa7c7caa7a68cd420249f7a9c31c9519a6f1b920cd7473697 +size 199058658 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e2435fbb69c61dab131144e406f785f9b6523aa8 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27c5937287603e11d9867755547dce03b385533b20a10dd3c2c18058b316de02 +size 199058839 diff --git a/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9fe4f7160f06c9ebdc64605cd7744e18425da7e3 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7858f04e33bdb81b1e62310df544c7359e202bf1f4ef5d76759f38329ae695d7 +size 199058839 diff --git a/4b284b28bc4seed2/global_step80108/layer_01-model_00-model_states.pt b/4b284b28bc4seed2/global_step80108/layer_01-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8e2e9440370740940310c5c6828e72656ee29a19 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/layer_01-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:279fd19bd7263c98673a550cf69b74e2898ccf2c16be3985c945846a2cb4a946 +size 167511299 diff --git a/4b284b28bc4seed2/global_step80108/layer_01-model_01-model_states.pt b/4b284b28bc4seed2/global_step80108/layer_01-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0a4dd7010757d3c5ea04be93e43df2a10e601674 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/layer_01-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:43faac450f34d2aa8928847d88e234a785ecb4dffd29b003cad20824fffe8dcc +size 167511299 diff --git a/4b284b28bc4seed2/global_step80108/layer_03-model_00-model_states.pt b/4b284b28bc4seed2/global_step80108/layer_03-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..db9d81fc6e73c2911d10d60f02184b185a159401 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/layer_03-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e4e33c4925f4cd50fa530a741cf4de28bbaf5deb16dd4c4302efd752ceb0e9ac +size 113308931 diff --git a/4b284b28bc4seed2/global_step80108/layer_03-model_01-model_states.pt b/4b284b28bc4seed2/global_step80108/layer_03-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5411be313f854682ab6ac6623b68e192cc6c8a74 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/layer_03-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:995c5f462a1a1cf939d91dbea66be94740ca2891a197e5e09716ac9e10b70e51 +size 113308931 diff --git a/4b284b28bc4seed2/global_step80108/layer_04-model_00-model_states.pt b/4b284b28bc4seed2/global_step80108/layer_04-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5ea8fb1835231c4bb96ae7bfbc1a0dc14d9dcd83 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/layer_04-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a172d723cd873e46b718ea5e43af7c6f67a8e6c1d1ecd8a1c03cfa6d118b6edc +size 113308931 diff --git a/4b284b28bc4seed2/global_step80108/layer_04-model_01-model_states.pt b/4b284b28bc4seed2/global_step80108/layer_04-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fb9c6180519574044de97e0f8b46516616249776 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/layer_04-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b4e62ce7926c8f1be151a3c894440b21677b67f25af71be96064eb49ab21e0e +size 113308931 diff --git a/4b284b28bc4seed2/global_step80108/layer_05-model_00-model_states.pt b/4b284b28bc4seed2/global_step80108/layer_05-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c419354c030e5b58f9c66e2b8a26da229eaeb33a --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/layer_05-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0fee70fa45877ffeed77239337d8e7ab193cbbac54b563f456f3daef46c51b4 +size 113308931 diff --git a/4b284b28bc4seed2/global_step80108/layer_05-model_01-model_states.pt b/4b284b28bc4seed2/global_step80108/layer_05-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d9dce002b4078bd91e36e4cd6e8fe14ed8ea38fd --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/layer_05-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:48c3cea93f54ce35da9a0394ab659194bdaae560839ca2c93c6a4ae630a31051 +size 113308931 diff --git a/4b284b28bc4seed2/global_step80108/layer_06-model_00-model_states.pt b/4b284b28bc4seed2/global_step80108/layer_06-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4c80d53ab2f0346c05bd03527751d6d26ffcc8bf --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/layer_06-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27bb7d176b4b03cb88b8336bb25c5fcbad4b88f5d32a1249d137670e7fb965d9 +size 113308931 diff --git a/4b284b28bc4seed2/global_step80108/layer_06-model_01-model_states.pt b/4b284b28bc4seed2/global_step80108/layer_06-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d2e1b2fe08ae2dc21709dc202606fa1a3c072f18 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/layer_06-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9239a20c711484f2888310bbeb421e2bb72fe162022d6c7b68bf3f41d15493c2 +size 113308931 diff --git a/4b284b28bc4seed2/global_step80108/layer_07-model_00-model_states.pt b/4b284b28bc4seed2/global_step80108/layer_07-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a37eb4f94219380166b5fee307d785f7e7240999 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/layer_07-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f1807c3e9dd1775558b40dc77969f2f54fba94f0f2929cb323b5a707b9a89e6e +size 113308931 diff --git a/4b284b28bc4seed2/global_step80108/layer_07-model_01-model_states.pt b/4b284b28bc4seed2/global_step80108/layer_07-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2b2bfb25981164a9575443251f8dad5a7bd4bd25 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/layer_07-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e11f646405cf67c8cea420b9fab58ceb19fb66f88434b7e07cb2e5a2b6d98152 +size 113308931 diff --git a/4b284b28bc4seed2/global_step80108/layer_08-model_00-model_states.pt b/4b284b28bc4seed2/global_step80108/layer_08-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..97f6619d9e39bce3d3758951d211ebe969ca64ca --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/layer_08-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:03bb0bb757fd6ce291526edc146c89d084c2778de064dbc6fa5154ff0df88262 +size 113308931 diff --git a/4b284b28bc4seed2/global_step80108/layer_08-model_01-model_states.pt b/4b284b28bc4seed2/global_step80108/layer_08-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..eb7612bc66597110e38effd226be2e960afc8bfe --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/layer_08-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:467015cdae832384da1bccf7f288587b1fecc8330f9e6560ef2285af828c63f4 +size 113308931 diff --git a/4b284b28bc4seed2/global_step80108/layer_09-model_00-model_states.pt b/4b284b28bc4seed2/global_step80108/layer_09-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e2a0e0c78669bedcd897d28edbe83e4f6f723ca8 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/layer_09-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:95cb23d4171a30b633f21d777427bf89dfd7e3caab338a553189bc0ac819de35 +size 113308931 diff --git a/4b284b28bc4seed2/global_step80108/layer_09-model_01-model_states.pt b/4b284b28bc4seed2/global_step80108/layer_09-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..329db212e00ce8e7992624468dfbc4e575eee708 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/layer_09-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a4d63e6b31523b4572726ea3a81acd16e6ae2a56be21cbd187380f78953f34b7 +size 113308931 diff --git a/4b284b28bc4seed2/global_step80108/layer_10-model_00-model_states.pt b/4b284b28bc4seed2/global_step80108/layer_10-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2627915fb64b30b15eb12b30b66e6a6f16bb6dcd --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/layer_10-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20f4e0ef8acaa404422d6321f51a37509316dfbe4cfe5c878a492574646e613c +size 113308931 diff --git a/4b284b28bc4seed2/global_step80108/layer_10-model_01-model_states.pt b/4b284b28bc4seed2/global_step80108/layer_10-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8ec4eb48a5367b980b6b70ba71a2fe573f36a103 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/layer_10-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9aee88b989d52263557663b666768439d45778af387820077915437da08d3e1 +size 113308931 diff --git a/4b284b28bc4seed2/global_step80108/layer_11-model_00-model_states.pt b/4b284b28bc4seed2/global_step80108/layer_11-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..232f07078d9c005696c0cccaaff94d7f0b59648b --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/layer_11-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d78fa4a1b72701fa952b5e87936baf2a6047cdcbd32615c6cf8330f4432d5e2 +size 113308931 diff --git a/4b284b28bc4seed2/global_step80108/layer_11-model_01-model_states.pt b/4b284b28bc4seed2/global_step80108/layer_11-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4628b5e3fcd10b64c797a6fcbac8fe5a13cb65f4 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/layer_11-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:81c4313b6ca317b0a0dc44ca40ed2d8da6039cd290d7eeee56e8bc05e94a0868 +size 113308931 diff --git a/4b284b28bc4seed2/global_step80108/layer_12-model_00-model_states.pt b/4b284b28bc4seed2/global_step80108/layer_12-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8b99e7b61bc18e23c496929e152885e3a21d6fc4 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/layer_12-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:477845182391e91420f05b8966e69e61090fb27878e4dafe96f62789454c8ebe +size 113308931 diff --git a/4b284b28bc4seed2/global_step80108/layer_12-model_01-model_states.pt b/4b284b28bc4seed2/global_step80108/layer_12-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..240507dde659a037126bc866380db4f5efc57a49 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/layer_12-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c996b8a9ca1c9aff931eb9df9489b8f94e3a208830ee444d70c67f66569c8666 +size 113308931 diff --git a/4b284b28bc4seed2/global_step80108/layer_13-model_00-model_states.pt b/4b284b28bc4seed2/global_step80108/layer_13-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4bccfc3feed43c0751b1694a7c2a1b2cbde4b3a6 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/layer_13-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:673c986aed8b4f09258c27ae250b068d07d56a064fd03fcbdb5bb37a6f652f03 +size 113308931 diff --git a/4b284b28bc4seed2/global_step80108/layer_13-model_01-model_states.pt b/4b284b28bc4seed2/global_step80108/layer_13-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..598f1aaaf9a21a0ae1e8119fa94b230f310d60ba --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/layer_13-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f118c40d96cf71d32cbf7675720a238de5fd622e1d61fa6e6c23a2aa0793e43b +size 113308931 diff --git a/4b284b28bc4seed2/global_step80108/layer_14-model_00-model_states.pt b/4b284b28bc4seed2/global_step80108/layer_14-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7e0f2df3206e96fb951d092f13ad4c511348f62f --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/layer_14-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1adbc5abea68fb20e83a8b18e3d8ac4cf632b6793de3e12bbd000017a0391d55 +size 113308931 diff --git a/4b284b28bc4seed2/global_step80108/layer_14-model_01-model_states.pt b/4b284b28bc4seed2/global_step80108/layer_14-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4a44dcd7ba6f34f5a6145d7a53900e5668959254 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/layer_14-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:33f5165b8db026005354dd21a1595e70251bcbfda3967623e8533059374b9dff +size 113308931 diff --git a/4b284b28bc4seed2/global_step80108/layer_15-model_00-model_states.pt b/4b284b28bc4seed2/global_step80108/layer_15-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ff307682722956ce5e07f6ef8c768bf66c4aa3db --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/layer_15-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b574bc4cc3d7b790c0fb91a03067833e4f5623c28e4860b958863133db1b5881 +size 113308931 diff --git a/4b284b28bc4seed2/global_step80108/layer_15-model_01-model_states.pt b/4b284b28bc4seed2/global_step80108/layer_15-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f0893e73fe4d7d712255b8c7ab3875a32014ca92 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/layer_15-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6317078d3d8a26a08543de925608d8d586e4b7af57184693462aed89d1c41a45 +size 113308931 diff --git a/4b284b28bc4seed2/global_step80108/layer_16-model_00-model_states.pt b/4b284b28bc4seed2/global_step80108/layer_16-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..35765233ec3361565959035cf70c3e7d9d113693 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/layer_16-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0fd3fd9f1ed113c0a48f301102f1bb1f0e1df2cdbed367c4f61faf8162bd2ac5 +size 113308931 diff --git a/4b284b28bc4seed2/global_step80108/layer_16-model_01-model_states.pt b/4b284b28bc4seed2/global_step80108/layer_16-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1f661ba5c6ddb2db8aa664e15304301527af2fa0 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/layer_16-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:44501bbc157261119c0e61f9101a8239ec08b6ee77e540e6a340c4b9cceec32f +size 113308931 diff --git a/4b284b28bc4seed2/global_step80108/layer_17-model_00-model_states.pt b/4b284b28bc4seed2/global_step80108/layer_17-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4e304bb090e3b78cc5ef2096743343c6ccd077c6 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/layer_17-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35526d7fecbcf98f76c0bbed2f4208a521722dcb07471d4dbc78ea40b6d5a59a +size 113308931 diff --git a/4b284b28bc4seed2/global_step80108/layer_17-model_01-model_states.pt b/4b284b28bc4seed2/global_step80108/layer_17-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7579e132c3aa104404eb51fa46a04ae2796ed16a --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/layer_17-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b3e2bed032c5450ca9e5ff42dfa6cf599abb9a9aa1e10bf9f4e3e0019dca1208 +size 113308931 diff --git a/4b284b28bc4seed2/global_step80108/layer_18-model_00-model_states.pt b/4b284b28bc4seed2/global_step80108/layer_18-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d01a8ab2bc3dfa81903259542dc9b375e50408e0 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/layer_18-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4447872f3aff85536782cbb078015b352a4c93e437771f0c2df75d03b6b9b167 +size 113308931 diff --git a/4b284b28bc4seed2/global_step80108/layer_18-model_01-model_states.pt b/4b284b28bc4seed2/global_step80108/layer_18-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..00a3e65bf213db9152a88e04b33950c03161cfd6 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/layer_18-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd758571bb86a76da6c609db63f89e8eadfc5909aa7d2950baf7a2b037d01149 +size 113308931 diff --git a/4b284b28bc4seed2/global_step80108/layer_19-model_00-model_states.pt b/4b284b28bc4seed2/global_step80108/layer_19-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..398c82e2ad808ee7ee484bc7b875896624b4e011 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/layer_19-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:beb27b21a0acd62c5493c22425f68bc2524cf62102eb3c27a436f61a36fae1a5 +size 113308931 diff --git a/4b284b28bc4seed2/global_step80108/layer_19-model_01-model_states.pt b/4b284b28bc4seed2/global_step80108/layer_19-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e3cbc351ae197673ff2f199705416e7befaf3ba4 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/layer_19-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c00af6fb26bf1dfdfbb70857a0015100067bceae7102569404ee61b09ac2d35 +size 113308931 diff --git a/4b284b28bc4seed2/global_step80108/layer_20-model_00-model_states.pt b/4b284b28bc4seed2/global_step80108/layer_20-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4f9374df0cab8657340410c1cab24ab60d79aee9 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/layer_20-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ede3ca69ec0cd7f310635bbceca898b929b095dd21b2a2f8979aa9a9d6ac1eea +size 113308931 diff --git a/4b284b28bc4seed2/global_step80108/layer_20-model_01-model_states.pt b/4b284b28bc4seed2/global_step80108/layer_20-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e555813f2a1be1788c70c99e813136459c751e5b --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/layer_20-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:464bb2d6d6cfab4d078a784ebd6867abe73dbc435ee8c6efff6a5f53b4763f70 +size 113308931 diff --git a/4b284b28bc4seed2/global_step80108/layer_21-model_00-model_states.pt b/4b284b28bc4seed2/global_step80108/layer_21-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ad483d3e9f102d62535dde8bc81f17748cb49268 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/layer_21-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc90f5184067973b3f25f7529baf33788ed553270446d5c369747d6ab45b2ba5 +size 113308931 diff --git a/4b284b28bc4seed2/global_step80108/layer_21-model_01-model_states.pt b/4b284b28bc4seed2/global_step80108/layer_21-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..940d1afbbe47ccb0f6a63dcce793bc822d55d11b --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/layer_21-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2baa07b2c73e36535284406a2259f7ffcba019553dc1a227aa2d253ba91554c0 +size 113308931 diff --git a/4b284b28bc4seed2/global_step80108/layer_22-model_00-model_states.pt b/4b284b28bc4seed2/global_step80108/layer_22-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4a39447da40e1169e6221889407f2ef645baa98a --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/layer_22-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:49e9e450ed1ae37da8b60f2f31b1fcfe3819612773117412b516a868bcdfe36c +size 113308931 diff --git a/4b284b28bc4seed2/global_step80108/layer_22-model_01-model_states.pt b/4b284b28bc4seed2/global_step80108/layer_22-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..eb20bb11ed8babceb4161d00cee0cb794bf97584 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/layer_22-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:933bc03ae54f327bd86411c5db5f3cb7f7d66fdc0a78be7c8ea05e52d8870a47 +size 113308931 diff --git a/4b284b28bc4seed2/global_step80108/layer_23-model_00-model_states.pt b/4b284b28bc4seed2/global_step80108/layer_23-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b8068ea8842c1946af2ef3c5f8e1a95a6f4eda3d --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/layer_23-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7aba46e39ac6c2aa2d70c7021b81c18e3f0f30ff334c897c81a9228c4f72d9d7 +size 113308931 diff --git a/4b284b28bc4seed2/global_step80108/layer_23-model_01-model_states.pt b/4b284b28bc4seed2/global_step80108/layer_23-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fbb2aa5594f4a28e974ea36cbf7dffeabc484926 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/layer_23-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d7fd98b193072ca1fbb8dcd021268abc4faa324e72be4474b5bc891c21d4e975 +size 113308931 diff --git a/4b284b28bc4seed2/global_step80108/layer_24-model_00-model_states.pt b/4b284b28bc4seed2/global_step80108/layer_24-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..43f0923cb9c29607c51de44a28398668f2bcd5cc --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/layer_24-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b24d505060eb15f5c8bf2b81b79083269a45cc34884ccf4f43102740d66234c6 +size 113308931 diff --git a/4b284b28bc4seed2/global_step80108/layer_24-model_01-model_states.pt b/4b284b28bc4seed2/global_step80108/layer_24-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..66702a70cfaab67895d3b08c9f89333faa5db80c --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/layer_24-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:30cf2e91c4c340e52331531a678949d584d05b290af2c144b9fbc325142d2027 +size 113308931 diff --git a/4b284b28bc4seed2/global_step80108/layer_25-model_00-model_states.pt b/4b284b28bc4seed2/global_step80108/layer_25-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..164e3866e7f9ab9008445146d3de101386469157 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/layer_25-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0368d72d1791c9a81afbced1ee742a5ebaa1bfc8b9d13875d950bd2d1f5583be +size 113308931 diff --git a/4b284b28bc4seed2/global_step80108/layer_25-model_01-model_states.pt b/4b284b28bc4seed2/global_step80108/layer_25-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..23f16a6205be317dcbffd315b7dee8000164cf0a --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/layer_25-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e1246fea0c468bda6c95f6cb13f373ad515fdd0ac8950f603628b2d4cc0fd9ab +size 113308931 diff --git a/4b284b28bc4seed2/global_step80108/layer_26-model_00-model_states.pt b/4b284b28bc4seed2/global_step80108/layer_26-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fcc1369450de1f45fdcad98581416fe10b9ef968 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/layer_26-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:037dcdddea888871596e4c864923d5b30594190dc2ddecd841c399603a81613e +size 113308931 diff --git a/4b284b28bc4seed2/global_step80108/layer_26-model_01-model_states.pt b/4b284b28bc4seed2/global_step80108/layer_26-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e9755d22041624f76fe9190167b25a228c5afe0a --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/layer_26-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:75b75a68a7c3eff7a8ff3efd5c1ccf4a7c52b79433184a64df52714f94022acf +size 113308931 diff --git a/4b284b28bc4seed2/global_step80108/layer_27-model_00-model_states.pt b/4b284b28bc4seed2/global_step80108/layer_27-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..65f0a166ed22093ee889fd87fa6ee0c9a7790b4a --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/layer_27-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:887b650ff9cc32fc045225900e8f7677ae56b97d1eeda1a082c7d5db69291e07 +size 113308931 diff --git a/4b284b28bc4seed2/global_step80108/layer_27-model_01-model_states.pt b/4b284b28bc4seed2/global_step80108/layer_27-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..39aabf0b76404e6dbc0288612595206e189dc4c8 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/layer_27-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ec14061c816be6f05a1425e84fe7b407dab096b61a33c66f3b9410e3acb4bb5 +size 113308931 diff --git a/4b284b28bc4seed2/global_step80108/layer_28-model_00-model_states.pt b/4b284b28bc4seed2/global_step80108/layer_28-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..256ab2e7047d9277d820b56042913bcb331de8f9 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/layer_28-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:514ca2d74f3ee3cb2807e073eff2c2cb6a5633f33b47b8bc9bd9bcfbaba97958 +size 113308931 diff --git a/4b284b28bc4seed2/global_step80108/layer_28-model_01-model_states.pt b/4b284b28bc4seed2/global_step80108/layer_28-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bf422d49af6dfdcf6ccf874ca14e8c0f2e6b934e --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/layer_28-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f491a170e6085189d89d20178f1d4dbb05fd3248fda96a36405ba8ee22fe2f9 +size 113308931 diff --git a/4b284b28bc4seed2/global_step80108/layer_29-model_00-model_states.pt b/4b284b28bc4seed2/global_step80108/layer_29-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d3bb71353269fc7de20255c7c2c8c8fbe0253b17 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/layer_29-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2eb51d48e157cb1477c4b03d6310e06c37a6d40939cc4ccad00ab49797e38c34 +size 113308931 diff --git a/4b284b28bc4seed2/global_step80108/layer_29-model_01-model_states.pt b/4b284b28bc4seed2/global_step80108/layer_29-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f125637be5c6beb6a3807d2185590ae6c6d99623 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/layer_29-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:57b2c9a5bdd0ec51b38cd539ade1a4ab4cd0dc006b5b3f8a94137d05df9cf48c +size 113308931 diff --git a/4b284b28bc4seed2/global_step80108/layer_30-model_00-model_states.pt b/4b284b28bc4seed2/global_step80108/layer_30-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1b4d192770e71c4e0d33b8abb194471cc907b7eb --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/layer_30-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7a4366dc4bd78b9f8b69e0d8ce7b5ab499103ce0ca77d39e312f0d3431e3b88 +size 113308931 diff --git a/4b284b28bc4seed2/global_step80108/layer_30-model_01-model_states.pt b/4b284b28bc4seed2/global_step80108/layer_30-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..60f86686c596fb2af2f39e0363e7a1e165ca10d9 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/layer_30-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e29c26a23389c5db0d850ab781d251e2eea9f50d24ec649db5d599d82092eb5 +size 113308931 diff --git a/4b284b28bc4seed2/global_step80108/layer_31-model_00-model_states.pt b/4b284b28bc4seed2/global_step80108/layer_31-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5374bb238fed2f60aa879060d7e182c3342dd4c6 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/layer_31-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9fd169a0ab22c30540e619764e26375b918cc7d55f4708171fb2d2e95e503e4 +size 113308931 diff --git a/4b284b28bc4seed2/global_step80108/layer_31-model_01-model_states.pt b/4b284b28bc4seed2/global_step80108/layer_31-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bc23a8c35a9bc019ce24a674c3071049a49363cb --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/layer_31-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ccf46927b5563927bc924ae60eb371aabf2caee6a423ee232efb7be7326eed32 +size 113308931 diff --git a/4b284b28bc4seed2/global_step80108/layer_32-model_00-model_states.pt b/4b284b28bc4seed2/global_step80108/layer_32-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4a69a510dbc07381a33b45d82e1077f3f672e1fa --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/layer_32-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f52a96b1a14ceaac083147728f728f9acdee00d0f777ce379494cf6bd662fae +size 113308931 diff --git a/4b284b28bc4seed2/global_step80108/layer_32-model_01-model_states.pt b/4b284b28bc4seed2/global_step80108/layer_32-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7d9c1678e21b8df8ce3317d35f836ba140571cd9 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/layer_32-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6114aa7e3658601af17abc806ba5944312c4f7d2001d076be89222640d44f28a +size 113308931 diff --git a/4b284b28bc4seed2/global_step80108/layer_33-model_00-model_states.pt b/4b284b28bc4seed2/global_step80108/layer_33-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cd132cf649f2bde3dd6b67c0c49fabe4af4d925e --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/layer_33-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c3c4ff637ae4712c229648dc7ebbe5ca71f0892d4e957d82d49ec6911841160 +size 113308931 diff --git a/4b284b28bc4seed2/global_step80108/layer_33-model_01-model_states.pt b/4b284b28bc4seed2/global_step80108/layer_33-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bfc3415cd88170714b1f6aee443c692a211840b7 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/layer_33-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:09254d3e69f3daa63dd6ac99b668ac6cd7d59609a1bde1329054b9b91da3478d +size 113308931 diff --git a/4b284b28bc4seed2/global_step80108/layer_34-model_00-model_states.pt b/4b284b28bc4seed2/global_step80108/layer_34-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cd080989b870aa4d0b82bd247707563910f5be48 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/layer_34-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:abf291d0e2ea92a7e293086a9d7fc6b83294d8e2ff5630a7202d43c4ae4ad297 +size 113308931 diff --git a/4b284b28bc4seed2/global_step80108/layer_34-model_01-model_states.pt b/4b284b28bc4seed2/global_step80108/layer_34-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..482c37844c3c935dc262186918c10d0ac9873482 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/layer_34-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:38a842b5ae01c0772c5506c584bf4beb75c94aae0f9c34e55f18d2cedd27a6f8 +size 113308931 diff --git a/4b284b28bc4seed2/global_step80108/layer_35-model_00-model_states.pt b/4b284b28bc4seed2/global_step80108/layer_35-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..27f31bb3a6b2e3caa094f160324827eb888a5604 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/layer_35-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:04843c72033d1332e903d774682077bf58de18154fab9ddfe78daf47dd7697a4 +size 113308931 diff --git a/4b284b28bc4seed2/global_step80108/layer_35-model_01-model_states.pt b/4b284b28bc4seed2/global_step80108/layer_35-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..404d9f52085fa1ba97d992f07b56aa93d4e48e49 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/layer_35-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:62bd0e73b5a6e1481719122103f7ed4f9d020c64df1abdbf204c8d9f72add157 +size 113308931 diff --git a/4b284b28bc4seed2/global_step80108/layer_36-model_00-model_states.pt b/4b284b28bc4seed2/global_step80108/layer_36-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..18141e32ac470154bf4047be758bb728789ef5bf --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/layer_36-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:435e1f7483f7cca0e24a801d17924d878b74f905b025e574ed3eb2ef2bc408cc +size 113308931 diff --git a/4b284b28bc4seed2/global_step80108/layer_36-model_01-model_states.pt b/4b284b28bc4seed2/global_step80108/layer_36-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..094f61cf0b702b264aa5eb382c6dc7eca67b5452 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/layer_36-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f259d0a853d86536c952a38ed0db8805bc1e19522c65aba3f1be0a7ccc0f5ac0 +size 113308931 diff --git a/4b284b28bc4seed2/global_step80108/layer_37-model_00-model_states.pt b/4b284b28bc4seed2/global_step80108/layer_37-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..913d700ee0936950e18a597ab8e235598019f01a --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/layer_37-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:88428c1fbb7b720a836d4fae61f6a5aa997354470fd2fe5a3f95ced2a9b834a8 +size 113308931 diff --git a/4b284b28bc4seed2/global_step80108/layer_37-model_01-model_states.pt b/4b284b28bc4seed2/global_step80108/layer_37-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c9f35a04049ffd7277ea5e232dfc2b1bb02aed03 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/layer_37-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f3d0bd6dd5fa32a5f7d5d625b4fce90604e94455d2b01f5eeffdfa49a5faf63 +size 113308931 diff --git a/4b284b28bc4seed2/global_step80108/layer_38-model_00-model_states.pt b/4b284b28bc4seed2/global_step80108/layer_38-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2662d13d3a3a7d212324e3f845544dc8804a5599 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/layer_38-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:402cbb05ae292352769d24806896318776c02ebd13cf105a48d21b12034e67e3 +size 113308931 diff --git a/4b284b28bc4seed2/global_step80108/layer_38-model_01-model_states.pt b/4b284b28bc4seed2/global_step80108/layer_38-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..445a1818062d5e8b219f2f6ed91d03bdbfdbd6f5 --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/layer_38-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:80ae1e1cce8f66ed3dbc9d7554950699492f76a127a4fd81eefac1e4cbd67c23 +size 113308931 diff --git a/4b284b28bc4seed2/global_step80108/layer_40-model_00-model_states.pt b/4b284b28bc4seed2/global_step80108/layer_40-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6cc321bb90ac4876150f2d378515f7efec937aec --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/layer_40-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d7da74727816bb743ee69fdef87f76848fa8085a302d47a29c5c89b830cd51c +size 13507 diff --git a/4b284b28bc4seed2/global_step80108/layer_40-model_01-model_states.pt b/4b284b28bc4seed2/global_step80108/layer_40-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3157af2f31529bcf71b464cfbaec1d446e19011e --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/layer_40-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6fa6f9257cb11da41af3f22ed21e2a9b6b89e94831f3570c9aefd2053e23beaa +size 13507 diff --git a/4b284b28bc4seed2/global_step80108/mp_rank_00_model_states.pt b/4b284b28bc4seed2/global_step80108/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ec66d01f3ea810cec381ae949c0568dd6fdc1cde --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:890bae46a648fc9fd56561f29f0716b5cdeb18e68a63154e1507f189c21c4288 +size 51443 diff --git a/4b284b28bc4seed2/global_step80108/mp_rank_01_model_states.pt b/4b284b28bc4seed2/global_step80108/mp_rank_01_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..36e98a9fdb91dfef52980c7bc7f95b75cdc2a6ec --- /dev/null +++ b/4b284b28bc4seed2/global_step80108/mp_rank_01_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5bc3d3bec914c655ebb9974dcbd5a9861f2e8a319fcd8731427167e641f3338f +size 51443 diff --git a/4b284b28bc4seed2/transformers/config.json b/4b284b28bc4seed2/transformers/config.json new file mode 100644 index 0000000000000000000000000000000000000000..df814c3a71ee49044410636b5eeb4f43611690ba --- /dev/null +++ b/4b284b28bc4seed2/transformers/config.json @@ -0,0 +1 @@ +{"vocab_size": 50432, "n_positions": 2048, "n_embd": 3072, "n_layer": 36, "n_head": 24, "n_inner": 12288, "activation_function": "gelu", "resid_pdrop": 0.1, "embd_pdrop": 0.1, "attn_pdrop": 0.1, "layer_norm_epsilon": 1e-05, "initializer_range": 0.02, "summary_type": "cls_index", "summary_use_proj": true, "summary_activation": null, "summary_first_dropout": 0.1, "summary_proj_to_labels": true, "scale_attn_weights": true, "use_cache": true, "scale_attn_by_inverse_layer_idx": false, "reorder_and_upcast_attn": false, "bos_token_id": 50256, "eos_token_id": 50256, "return_dict": true, "output_hidden_states": false, "output_attentions": false, "torchscript": false, "torch_dtype": null, "use_bfloat16": false, "tf_legacy_loss": false, "pruned_heads": {}, "tie_word_embeddings": true, "is_encoder_decoder": false, "is_decoder": false, "cross_attention_hidden_size": null, "add_cross_attention": false, "tie_encoder_decoder": false, "max_length": 20, "min_length": 0, "do_sample": false, "early_stopping": false, "num_beams": 1, "num_beam_groups": 1, "diversity_penalty": 0.0, "temperature": 1.0, "top_k": 50, "top_p": 1.0, "typical_p": 1.0, "repetition_penalty": 1.0, "length_penalty": 1.0, "no_repeat_ngram_size": 0, "encoder_no_repeat_ngram_size": 0, "bad_words_ids": null, "num_return_sequences": 1, "chunk_size_feed_forward": 0, "output_scores": false, "return_dict_in_generate": false, "forced_bos_token_id": null, "forced_eos_token_id": null, "remove_invalid_values": false, "exponential_decay_length_penalty": null, "suppress_tokens": null, "begin_suppress_tokens": null, "architectures": ["GPT2LMHeadModel"], "finetuning_task": null, "id2label": {"0": "LABEL_0", "1": "LABEL_1"}, "label2id": {"LABEL_0": 0, "LABEL_1": 1}, "tokenizer_class": null, "prefix": null, "pad_token_id": null, "sep_token_id": null, "decoder_start_token_id": null, "task_specific_params": null, "problem_type": null, "_name_or_path": "", "transformers_version": "4.25.0.dev0", "n_ctx": 1024, "gradient_checkpointing": false, "model_type": "gpt2"} \ No newline at end of file diff --git a/4b284b28bc4seed2/transformers/pytorch_model.bin b/4b284b28bc4seed2/transformers/pytorch_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..f2921306d3305949d445c51493e0ec1e0b0ab7b9 --- /dev/null +++ b/4b284b28bc4seed2/transformers/pytorch_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a9e42ae0839f8a56c21ce95b3b88e8c57e0f1fc2a9c5658c7e9ae4ad4d0f7ca +size 8781203669 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bd9dfb800d812fb58f5ff84a49b2f460090cb023 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e820dad0cbf5b993ad05f1e0b47d6bb79deb76a628550abe6c8ede655c46d58 +size 199058647 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..989de9fef3d323c53eae6da90518cf36e59443d1 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5971dfe1c5a45f29863c054ea885772baaf36f1c17504f745067cea500a55e77 +size 199058647 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b212df75e16a9db5775f115dcb38fcb955ca75f8 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab6701cd9d38ac3a8a79fd123c0bb46bb5a992fb817382aaedf379d9e2f80ca1 +size 199058733 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..28369bf19f9ca67e07df865505986fb65707fac6 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:396404c7d2215f786ca39443a9b241b9e02541d7acb0cf609a1b3121f818c3c8 +size 199058733 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c0507d7737632a9b4fa88786e212763668bf240f --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c267e19844fc12a93de2dcc860909ca5e93d143e69b5a469f3492abbb70035f +size 199058797 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1e363eed70b1a3b7cc0868b4ca7c8f057f356107 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c13349fbfbbaaf36ea1b7973766d7a197d37e8b3f73b8a26ad327155a55ccd1 +size 199058797 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6ed533ca98907e8fac939a2b5fdcf0a25bc64b5f --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e91228115bb89415a3d044790673c095f7051384e2e5df1ec04b0b3d9fcb5db9 +size 199058733 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..277e4018a1f052c76068f221821c0531f5887e11 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:32928c9aec9ec1e87d8e6c3c25e53e42f2514f053c6a19168cb4bb9d09f9fb90 +size 199058733 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4cea4024fa42ec634c263a4e3761c1a786a4f00e --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:17bf6e0121cec4ebc577ae3c10f64da1b24544824cc9f3619fcf7955d60adbb2 +size 199058733 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..40640645f5a70c72f9ed217403ffcc23339c123c --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:66b01c326b7bffc76e5ba517881235b406ee25eea4d6c84ad507c814f80cdeba +size 199058733 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..93aa6c72b5e0fb9a67c31a54cf21f7cdffed1207 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9ef9eb48088f1bce7f62372b8c2d58f7e5386922aa1415ee04949fc72cd8c7d +size 199058797 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..99573e1833382db6cc5f1db40e8ff1249a25de0c --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:956ecedd415c9c51c662e9b859a4973ec6e5fbb2fcf48a6f04dfb921bb37eabf +size 199058797 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0c0a7146633b2fd0c3a18ba00d424a71acb78981 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7391dd6e451dcae8327f3e97212ccb2214f99bd8f873f467b245cbaf140c2aa8 +size 199058733 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ecde2d93c214c2d33dd1d38167e094ed178139c8 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc7d1b78ad2a9d08ac6d04f8dc39742ad876b802809c72eaa491750490c84821 +size 199058733 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4ff4ab935f09c58b83e57f9db8ef4261a97398e1 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c15a4aa75a7760a987c67861b1d6f89ac282dea8a3a654eeb15ad098bcbef36e +size 199058669 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4a1e1f07ef081ad4753cf5f638fccea6e55f5127 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:abd45691425b3a71a1b0b8d2d136e467c596d74d93fb1d0bc5461609ce1d549e +size 199058669 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d7a2fb8eaa3ab239da7bbdb12d46c1e1522ffc86 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c13743e17a8f67a8c3b49330e1358a51f599f99e42c61a6afc761563afe31e5 +size 199058797 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b912071ea0f3b22271391e1eeaff37751f10de03 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b5cce55e672eb75c1dc547dc1f13dbcf681b916004f3bf1891873ee1dd8ce017 +size 199058797 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fc679f63382ea7f93c20bef9009a55fd1c55299c --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7de4b84706787b72a5bf411ad6eb880e2403b2bb1ea62c4c73363db750cc4b5d +size 199058733 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0c5a82ba3ea1860b47154a1022d57307e04a77c0 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa492500fd2cbf28256a30d1bbf6790a00b8dcd42c73b36d166f3aba94fe89e7 +size 199058733 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9db48cf2231e8a831770d4b9f1e6dbcee47010e7 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e634f5be5154da0c82677321afd4458810d0aec153dee1eaca1dee33d5007b52 +size 199058733 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b2f0fb653e7f626158a9998ee69f862135ef0980 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:707cbb8c73c154352fed1ecd59f9a446e580430524f637668daf150351efa7d6 +size 199058733 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9ec799f35d9534010c1ac02ea27cec6faf70bfed --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f4f03b3a3c3d58c5a7a6f7736dca995ed798cd22a376e43fd75de456d3616dff +size 199058658 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0e52fa3fe08c6fbd9381e1a96d9977eb8c03e594 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f0ab22b34d46b7247223ebfe6557f257592c5def1b2b3e6b16f9fdb1aad80c5 +size 199058658 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b45e63d75a9f91a4d1eddda5bcb86b2ff9c61f6f --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:700640cd61fa5b3729dea0c368f648514df2421954f16da375e18e78a4d04594 +size 199058733 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4dc7dadca881f9d3b575448ac941801f617a0386 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:67e270393ead1d59e4237c613648a037080a477490afba1ac3a0ca804da6955c +size 199058733 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..216686893edf966009aca780f1e66069f2e4b225 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:197b6ae8fac872e574a7e4d4884f5be49e3a7d42ef41303af470b083e996fa06 +size 199058797 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f51ca2c7ec47aef1eadf07c557641ca53c9e34aa --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:13b99350c00619413b778265b25e7244f22ec2505a81d1224c3a58a6d84cb536 +size 199058797 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0234473fc7d11fcede3428ec8c9e5a2d60542773 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e52fd398f40b205ae76b6badd93553c9eb30d8256c0ea7f76cc4e865e635e507 +size 199058605 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b5892614779809a65144064d3a3bf54aaa4e799f --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2cac4b7dabc370543170fceb9d1c205c645e7e94e60ba098a5f9e3365e91a89e +size 199058605 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d836ab871f7ff6c821e65ad0ce0bdafd638bd1d4 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d34095bae91a7b4d72a41e9675e7ccbbe722fa1792bb0bd660aeca5ee7656ce1 +size 199058669 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..55d8af100cf82378c192f2c73c06dd0fa25fcd90 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a2cd6e9d749b8a4076a8d1dc2648322feb2bcdc654c8ee430248f5b3c406f573 +size 199058669 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f072b20662af168f5937513c472fdf3435fd627c --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7281ed0a8a6c228c216f005a9eb6e803dc37a18323b8932c6989a266ded8f827 +size 199058797 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a684ca0b818343816fb99568610da80bf9529adf --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d195e1b41e2ff0b64cc674be7afc599cd34e65f79513b42aafafa61b04c2d842 +size 199058797 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..89a8da7002b4d1507d5ecda33492179011554336 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:069df8c06d340a1735d9de259c6dbe9533f249b1542e635d48140d6d63cd91f2 +size 199058733 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4ba8941e3e2687782746e480c314079c1852ac2b --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f96000d51c93ce60f39c1b5d7d755f1e3d67723a20e2fcdcf04cf438cff4295 +size 199058733 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f6943db5bcc446ff65df7cc02a09bf4a526e7e95 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1edde1cdb6f45b88a22decf55146ef2a277642f268d222fa4b3381823666984f +size 199058733 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..70fcb37504b57b7bc1d009f5c72dcec0cbbf9575 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5aada3e1c052536710d4b072b34e6a4dd3e775df617011bd42a53c8091e42d32 +size 199058733 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..216aa9fa62b6e139adfd62666bd2277165a33ec9 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e71986eb12d8df324978ed475c5558c41217735c25d319af05b0747d91cf0790 +size 199058733 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5fe3fbccd081cef29b5c179d9439e30c83651a47 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:411273e4bc2784fb081e25749b31cf57917cd14609b42bbf4b77cfff4508e012 +size 199058733 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..243be792f46439eb11c6ac4b83d76e3ddf960a46 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c173ed237c25062767f09c7eadd035b04fdc03b5b02c213419f2488bcdb73de +size 199058797 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..51d521a9615f68552e7d280c9914f411c17a01b7 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d548cc685dc4f0991ce9501533a40d794f6f591fe82b66a3398dd5095c190eb6 +size 199058797 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..926f2f3630299cf4008af5e666786bba7297a352 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b02d2ff6f71c4fee785885435234ad7876525ab6ce6cc84e003e5679684f49ea +size 199058669 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..20ef07a2b196afd5a00be4fc110ec6e789ef9d4a --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4214658fb792c9dab8e6765cb609faeb9a05dfd2de7ed5f93369add553a51789 +size 199058669 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6c7b3fc1249d5d57a686cf16ed23b1be2a59eb40 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:110adbe08c669a34767bc821a7ec7dae74f3af78f1ec33c39380663ab8d56304 +size 199058850 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..71abda3b68c9d05f1a10c814c0e1d4d01faac289 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e82a34358766194695a07ccbcb2e057be17e25e94cfe6e52fef6249c02f15f47 +size 199058850 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..384fc902a5abe5dbc64996aafb4ed72da33660ca --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1776a4b62e9f3a4f25ba79614a7974dcc26a48c31b0b5091626066fee059a6d4 +size 199058669 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8caf0589e9cd8a77b5f919624c8f06d279946ee7 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:36cc927cc9074882f076c712772acb9a2922a172a2a904a45dd937e7010931c3 +size 199058669 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7fe4b19a3ce8fea6518b4d63d8655367d60e778a --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d342e1a86b8f33f02f24b159989749930ace5f054b433f067d9a6750cb2caf72 +size 199058797 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..650de85e697728c828cd3285922faf11936f3961 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5864b064799ef4a0405d52f4340de43a2ee77b1e0d9354b4905cbecda17e9b9f +size 199058797 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e77d5143a839d7d25397fe03549c4b7f73aaaab5 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4fe61b877a9cdb628039c9c761b134772ca56cbcc875105b3365878f1372db83 +size 199058733 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4807d8bf2cdb367f038dae14d07817d6c42932ab --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d837f7b0ac0dff345659a56a92a68b44e262d4d2a92e4fe000f6027681d9dbac +size 199058733 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f4b3f1cb160b23659de03ac232446ee2e13ee728 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b2aaf853f7db9e791e22e150937ec9c0ec1fca113dc4f5dea6eb40c8711e2886 +size 199058733 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..37137e90ef52855ca4ef0e43e6bcf795ed8c998c --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c645af4ae2a1f3e785669b639a26f7d562e90234cf0bcc2f1a54ea99c53ed72 +size 199058733 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1ecf4fa58ef28b812df524c97f0312b7e8564f96 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:377ddd868ff27e5b3c008f191094be8bf7eb7e6d6fc8673c61a2ce52783655ff +size 199058669 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a2d7f7f10df6ae480bedb736a6c02960f24482ce --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d39b0268f0d3bc6006aa8051f39b804875d33fef859dcd6b9602d78197633a6 +size 199058669 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fb78bf32f681bfa245c0cd06bba0c4d0c51c6792 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f64d7c9552a15c1f55e7365f3e6cba54ae1cc7dcad3f21854fc544f126a9e44f +size 199058925 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..efe674dd5f43b58ad59f4753b26bd484364d2f22 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db29e75fb57c7f9595a0407102b28c9b87957049df652760cea9b1c1249b3e6f +size 199058925 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b083dc7a4ec5636a78d1d8919a9d6591bfb5227e --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd5ed921416d487d2321335fc11a0d8764df5d57be7a1256e8f3f7a587a5f20c +size 199058605 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..751115fb209c61db9659e06a6003eb88b4101dc1 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:028838a9cc6930074eb8a950b6f17e2234211d3b149804de2782435d956d370b +size 199058605 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..097d0339f13573e37be2f4be73e0955bd1ec14dc --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d38ba485e88b61e5d94df9b7411d511756aa7317e3bdcc16ff959223fd32be7 +size 199058605 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dd930b685c81573934ae54f35ecadfcb58ed7faf --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:17a3595ddf1ccb1373d6332f6bcfc3779de0ba78dd5001f8ac158abf978d84c9 +size 199058605 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9891785e98d77bb31e15666677ee0e69ae4d64e8 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ffd6a9451eb6ac23d9442dc0cf706b1a8c2fffd8c658b4d896b95c95b2be879 +size 199058722 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b8294ba79b55e55583abfc5f391ff63a91f66e49 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad8ed4d94a1c1025ae5056c52e7d66f5704c7d78b3243981d7681358372750f9 +size 199058722 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..562086c2f90a47b826df7fa32954d38f10dce458 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:736ad9e5cf1297692831fd0fa660bcedc712e80a544a5ddb4ce5af236d075567 +size 199058658 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..942768bbb1bd6d182e54aeab5f8be10fc0045b7e --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ca28c63691cb4ad661f933b1e70c3872f453272f0dadd24b8c18d3088a9ef1c +size 199058658 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..78e76f0062268ff828e7f01d34a5de43b47be04d --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6b44406c8915fb27addb0d8798ea00e848025e78342aa59be09a9a62b797e63 +size 199058722 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0a229174c3701bced32205fe11bce34c22060afd --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f4de0607db904e743af5e4be4c49385a2a67dabca7081fe9a6350a02fc8a2fa +size 199058722 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1fcc10e855b0e531ca0922712e7cb1c0f7f70440 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ec80de2dec32e11c0665a58c080552c10f53517ddc540eab8d2afdcf4b97bb8 +size 199058658 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0d2a885f706710bdb6624ba6dc677d35a73dfb55 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba36000cfd18f922a021a842acdb50baf787d7d40c005f012a87a84895bec274 +size 199058658 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1eda29a6c27c0d265693d9da521d124911cec54f --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1fb6caa7850de97410739c3daa9db5f1759a3e347689d3ff0f773d21b61a0cf4 +size 199058786 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a31aab494d6dfb2d6ecca6f00ec4a608936d4800 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a6ce829477626a0fdc8288b7167892d7ee8f89fede534079526a6768ea80737 +size 199058786 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..154914639d204ce7e28bf6f2681a78be045aba1e --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b68e8108e57c0f3c98700750cd981f063192eee28bac7c9985a15b828628e5d +size 199058658 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6b4d4563151e124c93accb5216844cd7a9cea52f --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:91ff760e6a22efe6068754f70a6f860f414942bdefa727e361cb131674d381b2 +size 199058658 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e9ed0e1fb8b4153832be90a76d7e5ddc7d790b24 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39255c49ab0456be04d8e9227570e4fbb6e30dd425767225e6654f8ae9acbd4d +size 199058978 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..409141e51581d16768cca545eac123eb2b362273 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a504651243b1a3026a3ba9a21e85f37d32c0ef332f76419228e96c7a9111b578 +size 199058978 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bc5de88d088ca91fbd58d026a69b2f6430bd6729 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac029c84998c0144a1c5c260af7fd03b904bf4e2b42074302a26ae9362785530 +size 199058658 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f5ec252e41a671b4b8d3243b79ff4d633b4fced5 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:85d6e8a03d0c670e0d6b842323ec84c4d8384f7e3c9ab33b1c8e51288f888dd4 +size 199058658 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6b36542030321643fd0247c89904c0c14094ce55 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:24d62e8d0387ef52c02c95dd3a922e407fcfaa709fa5e9118e693618c3592c7d +size 199058647 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7905552a01b6a3216684bd917d0ad6365c53fecc --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a28a13b75d7a7c5ffb68f7c7316dd59b69d1f00096b692042343852cfebed2f1 +size 199058647 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ddfa524373b4654c2281318b39978ef88f36e2f4 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:36bddc97db22799c9dd8904d226ce461f3ed5bc3e1c4ec19470997b17ab712a3 +size 199058658 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6b096eb3a737b0b1a3393d13199806afa8afae64 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e5fbc9d02e92b499a6e30eae407ecf8c36c64033557ed081ec2426c665a45f27 +size 199058658 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cc3200d9bd98ea1bdaec645861a62de94a2ec89d --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:30cf3908b2695aa63361c7c46894e4a59d8d519d5c56b72ad31f92359e576ff2 +size 199058722 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e7247eaa3ab359121311fad0da3f22a958229b4d --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba3d4896b2fa1e95aeb91ba936a97d49dd6c68569c0795eda3c5949845bb6069 +size 199058722 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ba1356563de11d2c416044c254bffe58abd24744 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b1298ac3c636bab595b7852f2314953004c6d63a18151e1e29ed8d17689562c +size 199058658 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a4d728125b03b6b06bb27f7abe0e18abe954eb92 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:88431be136128c72d5dd186ddb480dcd1cf0f6867366565d908ad0411e233723 +size 199058658 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3844231b55f8b2c4705722050ce672143099c334 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d94e36bae8c02c3ee5cadf0cd4d042296ae39d7d1acb7065b519feae9ebe700 +size 199058786 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1b30dbd3b7235ec241f04a6723c5301e5eaf5340 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0367516357c21914a0b945417c1a45868e0ba1fe297145589bfecbf0cd68cf09 +size 199058786 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..79b14cd4753b597201d1374c333a189c4c90d8dd --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:96907115d1f3557a46fc4791f5e0caad024d421f5b57e116c3e1a70f9d90a0be +size 199058722 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6cd90742afb4f22829cbcdca84507ef4c766c6ec --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:939309d163e149ed3d132e5af4b1754b2ad296478e33fe1dee75a5fb29015ca3 +size 199058722 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..776f9a3a98ce9ab29ef21595703fe35ffa9327b7 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:404da366bceeb9469606837c6d6c9d129c5a975fd991a1d91780c38dbd0cd533 +size 199058850 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a44c832615738acf73a0f6e394373e1e29364502 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:962984354d74b9d4ade44627c91d75fac8e9ad937f85c708908bcc4115d9d5ee +size 199058850 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e5476c8245b0c3872ad585b3aa4c0cd076490aa5 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f6eaaf8bac562f7b8d5f0d3f39385516cbb3f255b95357f8943bd448b108c91 +size 199058722 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dfe3604055d73470a50398ff62916d7fce5d5147 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba23c56cb61b0d3a4abcb9e8bbe76a00dfbb6ce5477512b7f9e270d6b13e56a1 +size 199058722 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ebf6f92af61b61fc10fa2ac1165e2f86a8a3d707 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9738f87e3545aa80d23ccaa04c86bc824fcfbe1d4068cdefc76e3632510c05e +size 199058722 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..95f859f520fa3df978cb12793d50ce3e24e8e380 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d77be2f5f97a91b324763560d0339e2411fbb2bbe359a0d3c221b096810b07d +size 199058722 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cfe82b643f1413c319c6429c54429c16f1fdb6d5 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:70ba3b191623eb3d42abf1be3ca707ae38fc276a0181b420544b191eb0840740 +size 199058594 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e9545372856f41730f66e145893a205db912b031 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:98ff61107c6479b3a016d08153423cf585f7db7cfb9eec270b11fa63b5b2d22b +size 199058594 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e28a2c24b035369f08d3c648198770963f9e9ce4 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7494ffcbe0f74570bac27779f08cb80b58a13d45b96015b80c3c060ca2f87f36 +size 199058786 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b91e7300a92151b4ebe4a851581d8242542d7959 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:49a3764038d7b531c438c0cd59bdf823fdb9def1547aeb83faf2911284d25759 +size 199058786 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..11ec1d7a1fa1af0727ac3c6d9895e5cee2537158 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3931345c680b9a29785637341489d19e89c3ed715e8146f56e95c54a7e293b1 +size 199058711 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f45504ca67327e18486782677c674c3f6628d241 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8cd3ddc30064a73d1e478a26dd798977b554ed89651d4ef25dfb6e6bafe20646 +size 199058711 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ed7dafdd7b7a36ca13ef9313f0bb54f7badd6fbf --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9cdccb2964403f22fd5c03f781c73b97dbbecc1d8ba7f0dcefd13bb9bd239e87 +size 199058722 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bb4b647301a45d1149b263697bbf1a530e95b0b1 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3dbed86c3803c4fdf5a3a4b977fabaa6c04c4222bca64555c22f1f1e96b9ffd7 +size 199058722 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ed0743a738335cf801c1afdeb774c7d373db5a63 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc9bfd898494908f4182198d80d92d1c8cb98c1250706166dddfc495e16d1122 +size 199058722 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4f7113abdd1c21fb6ae6fee11f5f3bec3fed860f --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb09c1c841261355b2e794ebaa0d614ad794db1c9468574b818b7bbb33fb6d87 +size 199058722 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..86d4abd4030e8b587d49d9ecb07f1961e5443a19 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:694723bfc51cedb1c3dd70ab879bbd1dc4c7aa2892c94cbc98276b6c35e3e9f7 +size 199058722 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..543198815184e80cae3fddaaa76f247726ee4dcd --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f42147dbdb33bb9597820661cac157c380501e6be14aa062f5639e2c7c746b90 +size 199058722 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..043278f01a49175c3ae25d20b7f44907d7fd128f --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ecf5254fcdb493f1da1dc5c3b379f5a5bbf75e48d1d3ff51cac31077724e5df +size 199058722 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ffffabde3591fabd097751da5d03e854ab559799 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35461a55078d79f3f8601f98106f14fbf737d50537c6a0ca006476223cccec16 +size 199058722 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e5a8a0c16b24e0f040a703bfd800c11782c0f56b --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a0584618b26c91dd62fde91b9cdc84a160e0302a3bfd45a1cf6a160507e9e26 +size 199058722 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1eac3d28ac9f0c525f95025b4d68d709a893a4e3 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6878ba907aa7de88b4b7bd5f842d453e1f7fdc011dce6189aaee67ec17bc93d5 +size 199058722 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..11a00421ed9db0b07e4ef8599c83f844d753f76e --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:26654cb58cff829bbda6887fb0d937624489734bb8f8c01f83c5a83fbf35caed +size 199058594 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f1fe8a29182601bec885bdc00407cd26a053b0a7 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fff19503789d30fd66b725ec474ec4a3b0a9c0bb0c80508521920d36618b7c80 +size 199058594 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..decc1e00384edde173c33f45531cf02a056dc887 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b7716be75695315776393a040ba617ac1aec0d3f9166e48c6682dd70b150433f +size 199058722 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3cb2d776986e544ee0e8715820d0111fdb903fc1 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:36f6e60de013dbb47d0a9c48629e34f3d7f637f7a942ef2fb8f826e1face0844 +size 199058722 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..701d33986ac37190679ff040481cbda10f0aeffd --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:52e7b16703c3bfc1ec491437b62e8dce109a933a7c0eff29f60a240d1c9a313f +size 199058786 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3ef256800c7d5e56b20d27a5057571164c418cfb --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:21e6a0179531b7b44930552b5f4cfa4552a69ecf3a5701d7719e213dc33e0cda +size 199058786 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3f83579dc8c1e9dac2fddab8712354bc301a8deb --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b732af4c73dbf7db61b8e154d6cb7efe39ce6b92fdd460280747cabb84229d56 +size 199058850 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d4903e23ce0fd60d96ad567071ad973d90b56a9b --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:95e27346ba5497e2cd51390c09168b6a9ca1eb169ce9da76b97f7fb4f00ad4dd +size 199058850 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2f6c271f3252df3f68d278ab65d7450e7a4bd3df --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:041def2ba47b4053745e2ceab2d28baef1ec4bebedb3825905f9d8a87a8f40a7 +size 199058658 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..381a85b2ed8c3efa3edff78e868259a3ed571ff6 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d519b1a3b4a02592f0f2e912f3b12ef4b679ed55db4498cee0bc3d4313421ffb +size 199058658 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7416bcc78ef7fd2e545cefda19987cd5ffef0c32 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:60793ea03beae8e20c49afadf06101927887cce60dc2d9cc811f3b2a6f3d3bf3 +size 199058647 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8326494e80e8730764e55d36115314d6feecc71c --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac0ae37527dd894d610724e5d8fd690c7f433260974e28a0841003a900b183f6 +size 199058647 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..36cca112b0c4603019223c3e5c7e05121b1d3278 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b87901b43c48871969c0bfabbc465d7b4b0fcc3347e85fb382c8ac01ea3e8ba3 +size 199058722 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..01b5b1161c767e365698d71b007386a9d5a9910e --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:18630489281e64f988e6f7dedcb7f14e1f8db447d48ceca112b28574645498b6 +size 199058722 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f5036fd5ca788eec6b36ef83945451a5a1d17227 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e5644f0f2b1144b27bf8d493771b550509d909787bf61ec0bec0108b8ac4169 +size 199058658 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..713e2c5b61c5afef86159813e15336f06c8e943e --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a98d5d7f6145b5f90419d1ea43c6ab7f9283e9cf32b8ddfb70fbadb405100f66 +size 199058658 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..08b8f826eecbc46395b110acc32226c00adb387b --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa2291436a36f397cbc2727891fa98a74a1e4b65929bdb5b0d6795cb92701257 +size 199058658 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..52a6dbb69eaf6834f438863a07716e11ce580ae4 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:85017db6d7bbce6693068b6f816f053cd5f801080581bbdb581ea04ba35a8ab2 +size 199058658 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0ca88d686e27f531184f91a7e6b2a6eb039538ff --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:126c400b3b98a836726a5568c8bd171c2cc6f842028c5b3ac2f2e8a7823764a1 +size 199058722 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e423fb6a209f4e421c3ed5ba416c3fc016569a45 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe9ca3c5da1bcdf223c150daf9bd96642a2349f368babd53d1ea83e0fa55eb75 +size 199058722 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8826e26e5fbaceaf9d2c5f46c396aa57e7654dd6 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3bf4bf7108cf2d32de6aac5c0114d394b593fe37a86da650005bcdb98a029343 +size 199058850 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0b723b1ba8041cccebe109ecbd616142c6091e54 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:248e48a1951f442b2c4d5d14848ad1fb0de19012e140bf7675022505a3da5430 +size 199058850 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3ff97dd7721ade03990c05f54a377de12923a9d9 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:52d775852bd9346cc1b78e26464ec6e863a37894d135a95add931962f9b914c9 +size 199058722 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4b3cdb261bd8cf3bd123747b57280f73d011b6b0 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:26e5c3de0b9887c2f9f37059088af598e7c0595603d75b0f11398cd07697dbba +size 199058722 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b282875a66210d50b9129bc66cf30a26253054e4 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc91e7c9933c28c8c156b56f67ad532fb7fe25c54b306a202ce3a353037a3069 +size 199058658 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9f29a687ad9c8c3c9fcc4e5d0037118e1c7613ea --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:61ec5337ab0f42018bce4eb9141b1cddc17b372e152e76b127b18403cd5f0fa1 +size 199058658 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e9b8c0dafe03da8cfc1231950bd90a2ad99f41eb --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a93c37b13856e553dc90f30bb419020391c014b5c8ce2f7332dc6e6043aa77b0 +size 199058722 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7f53cc56cf27051cfcf99c5530c55c1629345f4d --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:17ba5c23f78e72b45b010d40b5f4f0dc06d9af852f3c6c26d09484b8fb570533 +size 199058722 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1544c99788cd928822a3ee4ad404378c36960c95 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7331a151f3af0a6a29f705d452a1bc7e1fb3fcf9db5dc7df94bd5894250bc848 +size 199058658 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1b6edcb6ac7a45085d4b34fab636f20271c45eff --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd2057ac3df72a379cee5da4c3ea3458a1e6a2187cb920f0e326fa921f334b03 +size 199058658 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..086c6abcb00b9d64495c2d15d05bfe49c5cc277d --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:233d4df1084862af2dca5ef31ebdaf89f2a02a8490d89728e6bf4599a3ce0a8f +size 199058658 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ddb27211fab445b618c4b2efc9ad9940ac8b33fd --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ea2cccd2d6102a023d86b0e42dffe156c20b81c516b416593437f4f39c9e30c +size 199058658 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bbe2920f34f0be69d2e9668cee7589935de9850d --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0cf2dd15a9263c0f624bd06669ccc8b48eed978c21de0a4fbdf6ba3b322a037b +size 199058775 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..333f95d5047763cac9b7306c18952f1ffca88de1 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:696d29d82d914ae4926844ed5a24fc34e005d32ca84c79d17131b79bb5eee574 +size 199058775 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fc583ce85bac067d675721afe111ff0a3e9228b9 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:995a4716bc7fea22d7dacc87c0fc6863d6566453d389cb39866c517a9a692167 +size 199058722 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..44cd39de396679a3de67ab46aeee4613196abd34 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:95b9ad5ca428dd16437a6aac118fcdd3b1e415d1274cfd0f1b08b16317224f28 +size 199058722 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3028c1361e718395565199cba0f406542e215961 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f0930eb78708db8e0f3ff2f95b3a1b8982c29f969390b0ec5cb5e6c3af635dec +size 199058850 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..450818ade9ed11a53c02712c113295aba48d165c --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:600f86aab3afb9ac95beacf68d41b231d539623f84eed75e5430d6988cd0ab0a +size 199058850 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..10985c4cc1b626cd361f6e116c3a8ca504ef12eb --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:662a3b4738fc23ebfc654833ba4ef97e2030fa1d3f3cc20658a0a460b578625d +size 199058722 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..73de35f64a90f124918ddece61c5c615ab2a6c00 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b449a7ce56a4a4dfc112f5019d3f9e7e37b72d56fc681d6289220237386557d9 +size 199058722 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0a8827fb64727f1d3e7badd353f00cd01e16e169 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae421d15d0d129403417384bbf1027a27eb327dc9f93bc5ac2a5f63734c9d654 +size 199058722 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..03f92bc51120843f643962a7cac035a3318fdbb0 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9069e86308d2cf32832d9f4b321761d09cadeba37ea4dd57f719c7a64f2fd072 +size 199058722 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d3cd9997e99360eec338fc88187839ba098b336c --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8de7321469a671d6874f804e60e81dd0795df4babaceebb4e2a2935fc3caf662 +size 199058722 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..84287614492197bb6fdd10ede048abeb833383fe --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a176951a3bdb6074021090d50c74589db7f0e189853b1bcf4a87fa2aa54e4fac +size 199058722 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..03d64b3b03de88e24a5bfff6228ab48878b42d0a --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff18cf44c52c4b345302f7d278a75e57a116da28182cf99089bc21bd9c86c290 +size 199058658 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5be126334ed96d5174636540bd7680350d66f54b --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:48662d2de9e07cf15cb36357899c3202c3b051cc224018485c1dbb873fb824b6 +size 199058658 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e9076b14e5b5c1965fd1660218be477c64b2a033 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:862257230135e821ac074414352c068e6cd7275e71a303963a0a392bdf977e4a +size 199058722 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6c584713f677a7b572ccec0e7e13a3edef6d3b2a --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d19600a134a99d9282dc93e46cd8822de022c99f6e68d03f12311fd62a6e432 +size 199058722 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fdc67ce793afb93dbe339d97f0071564d48414b2 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:009154bda0138cce6cba94ccf1d3ddeca45d1acea9b379aa4ce737f33ae926c0 +size 199058658 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f7f90e2d372fcddce19459676bb7f611b2146ad2 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f1f6204244a6453583866a747ef5cf042461d6fa936f20e0d5202fb750725fc +size 199058658 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8899180b0b6c9cba414af29d72c1f8e6eb0bc74b --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec4a6919c7f0b6c4a341d7e5a847ffba0eb90c8259519f01dbb019287d804231 +size 199058914 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8a5fa7b222378c2c497ef6587c96bc2167cdba95 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2eaae729806e4311312c859541fe02497665e52e67eff4ec8d38f897dccc283 +size 199058914 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..be4110f8083af58d99c4b64ba454ce40f2f78291 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f57f1b6ee2f1bc2b4ca8705b6fab5c6a437016f06dcf6e99d75f2f7fde8feda4 +size 199058658 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c34c8dad2f54c6e145aecd74a893c770b0097bc3 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:12c4211106dfe958b619be1012016e1ecdb7502eaea2f5aaf5182acb4068a86d +size 199058658 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f84378441b8ac65243b7bcf35254f42eed94a726 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:71ec3a36aee6d55602c6283790dc960958738efe30638385ad138b88726eeeaf +size 199058711 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8b0fa53d93ee753ef72b37082c2c6ea7b6d5f9b7 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10686f66410b96df9799fe261dd80acbb7283f1ca94aa69b4f767c79710fa6f9 +size 199058711 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5487c196172b34c27ae5ed4375af1b5bcb4f9361 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31504a0361ec6d142f0d7156933a937af114d1dd83ebb07da67a74d0f63325d3 +size 199058722 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ddc68b4ccfeeb3cccd5e89a52011c4081f49af50 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f94e1c99597fe237acad1c392c1a1fdcfd618143535f5956d0e53ef6b91d874 +size 199058722 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a92ea959f30b9690181995c976ee2c8ee6b1e953 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b98bde96bbe7d4bb0faebefd2e19d7d031b8fa5234650ebd6015704b4558f69d +size 199058722 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bbb178650170c38a87ee4d5f50cc10225564f370 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e112ec49b4957dc414ffda900fe06a15585d6d4653113099da657d4d971767f +size 199058722 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..876d5b84c81a2327580b81d11d1130b16e003bf9 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2cf32053967f51094ded49c730a9f10860b430c88d579f4dd9d4d97c1e6d4b77 +size 199058722 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4806dce6130cd0e35e9e0aaeddbf6452da91d22a --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bbbdf4cd0755aa5a2747047cee7c4535d12280bdb30329970ec853ca553b4fc7 +size 199058722 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0933aa1033fe320f4a0760426839d90a6b9cd193 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6c6fff0bb341adbf38feb69f87634e3ccb2d8444e1257ad6430c3b81feacbc2 +size 199058658 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..464e941a85e1717e74234547f67ee9c1a82ff03e --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51f905c5e0cab8acf093ea990cf89785650ad5e3797ca133acb0baf378b243e0 +size 199058658 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..725f1951db4ad494063962328e3d4f9fcb2ddadd --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d4fc0fc93d29c4802740df399272d88f81bd8b5a4d2973b37d10f2dbb8838ca +size 199058658 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a24eacba512c317ac26a1a4c72570ee82fb275fa --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d1a761728ae87a6a80a51b6dd79bede1f81c0f3bd5d205191fe42af46a0a1170 +size 199058658 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2eb35c76985f4e8a2246b87b5a6c444a4fdf556e --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5835087c5f5e307a003878e0f3b38eacda916eb4746166e8aff13a57daee5346 +size 199058850 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cb68da5d30e22c26a55ef4217abdc75f2199743a --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b457c8c6cf153521c2fb54b6e6b37ea051e3f40a52de4dcddfa344b2ec52de4 +size 199058850 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..555cd5980f41a1ed282d93e4928751d75f6a6b65 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ccf2bfe40c6eec01dad7796dcb8698d8d1a8eacb4700de90e8f924c40bc001f0 +size 199058722 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..29e2098810d44d043d1617508a7e3f1947a46312 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:047fe067bc96918edebb4bf49c09d9895e5383ad0981632f1a455f3184852121 +size 199058722 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bbc1a43110060ade00dd9dda1bc6118644450cc2 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d675d3e0ae35ec3168d1c880c117779cee26f36ebba57f9c81704cc956793d3 +size 199058786 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..16854740e87e301be60e0265e608d2c22f073ccc --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b67fced560b13dea2e06538cfac16906be943bb9230cac487fec0622005c3af +size 199058786 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1a1bfe064e468b076ed4fb1d08571bfe97a2d5ef --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e33207aa83b3117a8ea8266576c08c9d06b42f81a2a4bf2a0b2f70794997040a +size 199058658 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..565a2a2985f7f57dc3b38eeb655381f09acc184e --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:287027b929373b8288f8935c81dfa02ffcb064bb44e124e87b015ca6d98d2a5b +size 199058658 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ad88bf3575e4bdc1c1124412da4967200d1a5345 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7eb3607636da51930b9a787d06b0cd7ff239ef6d69435156abe2cb4b471b3e5e +size 199058722 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..40fad83b75c6e6f0b42a90748394d8430b01ab66 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e22466f405b3f8b2207b93607af09307bd14987acbabd3471c894fa7dba93358 +size 199058722 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..aa83ae26e19336f5c7518b2b6f3dd68502b01dd0 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3706d9cd5cb4bfa9e94ec387ebdff76e1ee5e4849aa7156db37823e7ac2e6888 +size 199058647 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7cad07e5498280da1640a5af72dd03a94ad298d2 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d8dd8060a7223aa33fb1691627ee00367ce660b37a46a606b701464b1c574f9 +size 199058647 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..059d63e56332466df7ccb3315cf1eeaa1ef0d0b5 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a77a1c2ed24dff9e2b701d431d909d5875c606bd0b40c70d7e64a55ae851d35 +size 199058658 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dd43215a69334ffd3baab880159e182659634c2d --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2d928a112bf892d5ba25b25ff3412c8b8c1b1787a8f05075bcb4d4e3bd4722a +size 199058658 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..65d425d504738f7de5e73f1790ada5acd04c304c --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca6cd38d3716869abe15970551127f01e0f37fed9a03018c492fe1d9891bb811 +size 199058722 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..10646e8da01c3497506136dbe4db4ce7bfd2a7f7 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d992c801251958b33fc5265438207cb060cdf76e5c293b88afb275596d21f2f +size 199058722 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..77e60139121799cb131b0c1996f2cb0709e1aee6 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d85a60e2b855eb4a4817158d396aa00b25f44fcc0c2e4c77c8d3ed0aad360df +size 199058786 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d3c34f5e3a7150f9205706fc8f07fa032945fac2 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7af8a8df8d13f4e4729ae4d2e20198261d752c05730e165a4c347e97196e3f7 +size 199058786 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..08b118549249b0bab4dc602a52113e3f21d30529 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2307e286c67c5f46abf24197787a51283f675c33c95c529b1f0774fae8b8ef30 +size 199058722 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c255cb3eacc5207a6f19ad3a5f4ebac1ac14c74a --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:efc97e8cb7d1d7ff0bdb0ae0cb202a491025e268a3e8fb958f905df061dbb9f6 +size 199058722 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f47a55d28ed24c21a43945bfc09ea7df7e007e69 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8f89eeef65a425b97d0c5b13aac97884c5b204abbe8f338229700192266fa65 +size 199058786 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b966792271059f36952ba0095c1df536c317b11d --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:65b6fc0d464954f6b554076952f08205d85f99dfadfacc7ffafe975481ce1ff1 +size 199058786 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4945ae4966e3b6081a567269c68f394f6a6d56e0 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ba74e4cffc82b7e05b7bac978e24fc18e4a0fe314f958a856d67c51f181edf3 +size 199058658 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e136d9111dc341cee8ec1bf8323ecb7a7c0a3021 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:42b3f1e67f5268740718b962c8981fabee3a5393a3f964f382ff27f6a186fc68 +size 199058658 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e726b8f1cf91f5fca543a1eec38e9e5ff63bd027 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2cbfed594d6aa4fb405f37ac2030879280003e2995c9c45bab40620a57992796 +size 199058786 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..859691e8b690337473e4c176c7c6393e485e66d2 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:525589c942c2c3dbc8192be0e3f2c2cb79ae84dc4da7e60d4d933388372ec614 +size 199058786 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f165c7c7ec658654d4c46a1ef609adc0a8d1f94c --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:99389379853fdb2900750300f0ac6e2543ff1d48de18e8254a2a11abd33b4b6f +size 199058658 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..aceb4abe66c4fb863cd5f9dfa01524215a827794 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:958c5f30c3ad12a8dbbcf4d563f405f61c368292b1fc5442a2369bc3beb5b266 +size 199058658 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..90931ff3e06ad7e940672af1e28f0b4e483906a5 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9dafdeb17c6b0895d9a862c5bd91f1812ed5e30274f525bc58036c25341c314a +size 199058786 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1ecdf697abebc655e5790d1b964e45ad237c0e36 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:120cdb8122f07fed2e3fdeeabe7612d3aa486ecc30ef065eeca4072689b41137 +size 199058786 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e6de4a046a48f8824aa068b99ca0e235ae54225 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e46bac2b91856aaf6c8ce632c55cc1066e811b71736c0591442db03fde4fab05 +size 199058786 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3bef7c741dfd782f19456bdd944a5af8ca0e5e89 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:212942de683ed8e1bd0e4db79b1d1ac9f196dcea62756371a7780d0d04dfed84 +size 199058786 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..336cda6edc3843f3927fd000aff203fce37cb4e4 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b6b8b2828fa983c20852df34fb1807b43a3236878656a9afa011a893b95ab0a6 +size 199058647 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..154ae76d0eced91d62a8496eb5b7fbc24d9bb0ee --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:85a117c0e9cdc34e29f91293bdc6921bd58c200123bdcea2664a1faf77ab4602 +size 199058647 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..692013a456625145107105839845b5a81d6f5190 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d38050816cc99c920d0582357f6733bdd5c249f5415690382c47fbb90ae635b1 +size 199058722 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ac33cdc8a1065ef038172caa228e7bcd2d89b1e6 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5755776f8caa32e932bcbdcac9fa63836f6cb108b232cefc63a5e0dcbcd1659e +size 199058722 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0847a1d0638a417fc5339128b9b4b51daad7e36d --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d80986fe819f57ddc2da4fd293be748985f586c55489aeb6080b1032edebd15 +size 199058722 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8d9f663753b25a95ea3f51630c28d284de9537ba --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be9e4767c637a87893bf0fbc5245e99e5783cb93a05e14c306ce22ca5ec7cf91 +size 199058722 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e104da382abb66a79da6533a02a7d2c5ec7bae2b --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8749c978c0ef6da31015cecbd8dc0c93b6ecc6666394bb36e4aa9450310d6ccb +size 199058658 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6c516d274a0f0eb31c4fb89374021b9e73344c86 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:869c537d71d428dcb486f6c747c901ac1ff8b5a707ef0674dec85d2e6d1a0f64 +size 199058658 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e33d3b5aa4de79c72f53cab97d33b13acf6d84b9 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f3da764f456267f203313afe2f64fd6a7bd1037cadb02c03e474222660b58caf +size 199058786 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c989a87808212613749ce58383d9310e44c0b2f0 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e5b5c164454853b3ce9e459250a7491a29614912264981debac9143ca4028f9c +size 199058786 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a659cd6535a851b8076f6cebf9900aa4d9e7f810 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3672f467fb44e3ed939cb49dce36ff3645ecff5bb1adb6bf1a262c432a90e033 +size 199058658 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..318d0ee45bef3c6d93e5f880d4d7f83510fbf9e7 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:93a4555b1a6c10ae3081d8ca21dae6f56bc191c30153ada4c1a7e79fa4fc875c +size 199058658 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..14f6fe9beaec660e6738653e558cd4cbfd7da8e2 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9cfd98e323300d0d54fdd484e6746cf7c93ba31ee737dbadaa17497a7eb2159 +size 199058786 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c0ce139d009cc0d408b3ac5c0ad1057b582efc81 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dbf7b932073f1b8e079d117bb31ba4a510781c175afdd8462b7062df39e1cdf3 +size 199058786 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3e98f3130662ef690e00d356b6e7d66e7c06ba0f --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a2e0d4e744ee5e9a0eede9e4f5436b03d55cfaf6f34c48cbd347770711b0be8b +size 199058786 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..27e0ed4015a21462335a14d6d4da938a8bfe0db7 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d01ea95b373ac0a3dfde493ad0f45539464a62a47e3e4575c4ac5f0bb5a8877 +size 199058786 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7c7390e067ab03744ab3a1341f792a919f2412d2 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8dc2a2891498c9ec462c48fa3a95990867cf392ddea00d74f000848ba2694f88 +size 199058722 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5ddd54ca4d29e3886f1922c548771fd3b5e40f89 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a6993fa40e1dd76a5bc873b002d8e28087b36fed455818667320c3d450e5f13 +size 199058722 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..95326dfaa5a3ab35c1c29fabaf2d7b28a7b1c155 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9541db3f81fe5872bb4765288be1fd0a19958c634a7abd572731087584f95c38 +size 199058658 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c1cdfdf9351d0508c984ffaf4a2323bd8c4b2a45 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d8b2982c0cf9fec869a2d2be12bdec554f2cfaf7edf5a719f4054413cef4ab5a +size 199058658 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4b50f050c18eb0da1c3068c70159f053572e1dd0 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa724bf26eea79cff4b99faff2ed35783e914744950c61e95290b5e9f79cbef4 +size 199058658 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6c1cc6fadc44dbcd1fda958f471aa96386047ccb --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c43c0f1ab25161640fb254db7afa19a244ffd8a81a339dfe61e8f8419391065 +size 199058658 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d4272e363610795eb256dbba275cd70aaee9f71d --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:547f2666d7377fae58434911232b54d594e71556a6bb6f67c9d5eddbd5d5ab17 +size 199058647 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cd2b9be75dd986a31030532a2ae1b67d2dc3fb40 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:41a730efb35bff5354a346f13ee528cc14fe9274c54cd03923def20f9c0ddf85 +size 199058647 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8f99d9c85a1f002d00cc39520176e695071d9ef9 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e9eeaf9080f2f3c1d014b63a5eee8bfc20e9a78965abfe4f1c2d501bc8dde9b +size 199058850 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1a4e85e8ceae4a57c3b95de35c7026d0554acc4e --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4497481d154520069618815eb5539bb3d0441cd6acf68ffea4461a6cb2b7e418 +size 199058850 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..887203053192a721d985978090f720a2d656ebaa --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f51e0b7e1f34c387613677055f05d379c3c61af92d683570111a7d548c255e29 +size 199058722 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6fee964e736b138c3e42cbdfd169e5d0a344ad76 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:87e95da4cb8646bbb4158222df07cdf9890f736db26081e6654a0cfbecf415a6 +size 199058722 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..81d113ea8540c48678f938f78899b1be66512c60 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:52af52dc6b07f2857f88d90beb57a721f8817d53b424ec4d8acb6ee9033cc127 +size 199058658 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0c4c82323dc3deac64b0f2530c9e7735932f8267 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20d0e64a6b81aea29ac4652c5bb874c03d2493accd23cd07725ee2dc582865d7 +size 199058658 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7febfae057b04067959d8fdcf08880057de5232d --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f6b57a83473c1dc064e7f4c597e3cac3c3bbe5eb03b47a049b3fa87ad2884b9 +size 199058786 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dad6f182ce9a72edcdde80483301bb5ad7dd170c --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e5055a3abd85ad1bcfa8e3715fc9fb038d3628958690abd00bccaaea0f7feb5 +size 199058786 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..641a41c67fd74e13118940fab1edfd3040664a4d --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d71a50eff4fb35654796ef6594cf6030885604536606624a191bcdbb3ba1304 +size 199058722 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..056fce6088e74b0e3f98996fb4b1c0ef5078fca1 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:654aaf1e89575f9b8b056bac7ce78f473892d2c3abbb81d9a304506ee2359726 +size 199058722 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..953c7a4e447e7e14b966be81c7ce28481f23d783 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:919939cc47e9bf73371bd540ce72a2f02d83584accd0d57265d2aa008b8fcc73 +size 199058722 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..57b23690bdecdb96f454b5dcfbf7d94d56a043db --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5998c8cfc9c13044849c8ccd954a32cf7f8a47ab3c2e7b7ad0289f00d4c22400 +size 199058722 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..787320819d8b100bfdaf8760fa438991027a4683 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7144d9774390ccf8cd539f38587a72d0c85f9913d6b0527b37c53003f0593a3e +size 199058722 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..92be1f8ddea6235d394c35ce31842db144340d7e --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b08977d7b082860ecdbcab7561e785edbe535254f3a7a004936d2a5cc68ffab +size 199058722 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b9576e83edee204c40f6690b242a7ac081d3e1e7 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af1adc2cadb89bc578ee3c95aa6a63f6f14356e6d6b286deda06a08441f0c193 +size 199058786 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..593f4fca4decd567220756a2dcf592ac4e9a4217 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8fe122105ec3b09d3e0356cdce08053a3d382a3994aa0c52703e64de9c7a8dea +size 199058786 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ec62faaa7b61c90738eb7f013f070c6475e20f2a --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:67210406f6d413e3a1c2d59f210fa95eed68871497e2a167ca172c47e8a69b9e +size 199058658 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..55e3022fda63d143603bc9203e63945c4e943e2d --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f175e193113ff89bd6837ecef9194064e1114033e5ffaf94c22b558a50137c8c +size 199058658 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..08175a626b8901d40c8f1838e9e664dc4689aab1 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6959d75e8771b7150990f4b606da3c58a3d912a01a74fe5f030bdbec8b960c30 +size 199058658 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..efb0745976354c9a3d63a505f710b2350dc3feeb --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:abbb13b02223ed18845eb8b84b9d837065d2b9f8b9b0319b844bf1d23efe3182 +size 199058658 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0e81be6889b79dc9bb1a26fdfef99e6d98a8073a --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:89184c029cddccfc2243223a9a810f70a9ec33f3d9be7a361a8f6519faeb557a +size 199058839 diff --git a/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6aec6505ab83443d7aeadadca37ab1de8fc3390f --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b220caabe02a02225e164ebd733bb4639b590f228baabe2aa89b1c51efd07ee +size 199058839 diff --git a/4b284b28bc4seed3/global_step80108/layer_01-model_00-model_states.pt b/4b284b28bc4seed3/global_step80108/layer_01-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5c15fabd0251d5d71f1c115ef7d3954a61964fec --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/layer_01-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d67f45407a56b86a8b47add97d57b263ef2a07d69eb78e780ee6472ee2e7df73 +size 167511299 diff --git a/4b284b28bc4seed3/global_step80108/layer_01-model_01-model_states.pt b/4b284b28bc4seed3/global_step80108/layer_01-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9c123c38b3ab029a299c8f8f95ae1dfbac310e7d --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/layer_01-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:18849c96e5e3f2733223afcf8067553711211b86930e434fd2c7d24a9fbae7fe +size 167511299 diff --git a/4b284b28bc4seed3/global_step80108/layer_03-model_00-model_states.pt b/4b284b28bc4seed3/global_step80108/layer_03-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0a48099d19b08810860ffce8fa95ef857aa1ede8 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/layer_03-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:057a2a93fd8832fe447335d3a7144e78611044ec78d1c199ccfc39806168c6c9 +size 113308931 diff --git a/4b284b28bc4seed3/global_step80108/layer_03-model_01-model_states.pt b/4b284b28bc4seed3/global_step80108/layer_03-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5f8703453bda6d5841ffe36e905c09e7f4155e1e --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/layer_03-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:09b48313ea23ae44628094c28c4d588a977466fe076d6f079af7ac9bc33b5cac +size 113308931 diff --git a/4b284b28bc4seed3/global_step80108/layer_04-model_00-model_states.pt b/4b284b28bc4seed3/global_step80108/layer_04-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5f7af90ec9d3023fc937f4a04b1249e3e9e085a2 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/layer_04-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:603385db781585312fa0213a6c0e40664aa14432e2c5098fb55fb249a83a797c +size 113308931 diff --git a/4b284b28bc4seed3/global_step80108/layer_04-model_01-model_states.pt b/4b284b28bc4seed3/global_step80108/layer_04-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fe15b86d0d58bcaa230bd554aabbfbba97b7362d --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/layer_04-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:86219b6fc6e12a0d46bd1632f03995acc7391d3d32cfc0837f3f2d85e771ce3a +size 113308931 diff --git a/4b284b28bc4seed3/global_step80108/layer_05-model_00-model_states.pt b/4b284b28bc4seed3/global_step80108/layer_05-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..033b7c028cfecd7b8b5944e05e339fcda9c58b2a --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/layer_05-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:967771d2218cb4654dfe7172f9c94b6eed1823add14b741b61b6b401e5fec013 +size 113308931 diff --git a/4b284b28bc4seed3/global_step80108/layer_05-model_01-model_states.pt b/4b284b28bc4seed3/global_step80108/layer_05-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c287393831737b4cd6d5c588a0da207ee005ea88 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/layer_05-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:82c60ad33b907667d7407578c20ddfd951ce18cab66009fbf2ba1524b13a7791 +size 113308931 diff --git a/4b284b28bc4seed3/global_step80108/layer_06-model_00-model_states.pt b/4b284b28bc4seed3/global_step80108/layer_06-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..004dcc7924eeda1da663318729d93f8d0fa95c3e --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/layer_06-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7fc22729a74fdb1110b59f7e75ccba80880b38b0b243c86bddabdbaac4fba520 +size 113308931 diff --git a/4b284b28bc4seed3/global_step80108/layer_06-model_01-model_states.pt b/4b284b28bc4seed3/global_step80108/layer_06-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..61311b5f23aa6231453cd7e4539f161dbcaf6489 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/layer_06-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:86137fd39569e4e8e77ab42428cc1ae1ae90b3952bc53446530913888aaa58b6 +size 113308931 diff --git a/4b284b28bc4seed3/global_step80108/layer_07-model_00-model_states.pt b/4b284b28bc4seed3/global_step80108/layer_07-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..912fc332adb8eb75474db097aa249e9ff9069cc4 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/layer_07-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8c8ac8785681d52bf84d40a93a9f38f670bc570d9bbc8abf9ef9e8f0f964f49 +size 113308931 diff --git a/4b284b28bc4seed3/global_step80108/layer_07-model_01-model_states.pt b/4b284b28bc4seed3/global_step80108/layer_07-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8f27a9958f434c23e3f2715254e2e1fedac069d6 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/layer_07-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bdca1398dfe16b6587b126490ae2227338e7d995f3bd348674be105422edf1a6 +size 113308931 diff --git a/4b284b28bc4seed3/global_step80108/layer_08-model_00-model_states.pt b/4b284b28bc4seed3/global_step80108/layer_08-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..91b4419c62da66392ea24df9b566483ffd1281e3 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/layer_08-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:067e762193d1d9a3751ded98e5307207432d94ddc3422b8a5ce95593bf2ab5b9 +size 113308931 diff --git a/4b284b28bc4seed3/global_step80108/layer_08-model_01-model_states.pt b/4b284b28bc4seed3/global_step80108/layer_08-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1ebf29427db17537cc4c2b9db02ac8370d329187 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/layer_08-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:836ea20a84e5271a5c9eab33b6da967b8ef7d3326bffca7b457614242d14e063 +size 113308931 diff --git a/4b284b28bc4seed3/global_step80108/layer_09-model_00-model_states.pt b/4b284b28bc4seed3/global_step80108/layer_09-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..39c011fe403f26368774a1b59233298777c345ba --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/layer_09-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bfd049c111087038cc646c51c50e689dc6acf5bdc9cfe49bbf0191a98219f989 +size 113308931 diff --git a/4b284b28bc4seed3/global_step80108/layer_09-model_01-model_states.pt b/4b284b28bc4seed3/global_step80108/layer_09-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5b2312bf43ea7fee8e4dbc9fada96871d812008a --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/layer_09-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea812950ba4b5cd93147032d34c9ebc4ba638c0e0609763d54206caa73629a65 +size 113308931 diff --git a/4b284b28bc4seed3/global_step80108/layer_10-model_00-model_states.pt b/4b284b28bc4seed3/global_step80108/layer_10-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0a27ff6812d0f9127ab9f9e90f4e37ce88f0b6c0 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/layer_10-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c4c041e7dc64da7fe084890e5e6f5c5c134191a959609a1a005d378ea017e45b +size 113308931 diff --git a/4b284b28bc4seed3/global_step80108/layer_10-model_01-model_states.pt b/4b284b28bc4seed3/global_step80108/layer_10-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7bbcc27559e1de90367dec34bf58d0e7e6442f9d --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/layer_10-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ea563c1fb117a40097db8fc9904989cc43e2db6d06cfc0062608c3b4ce1e13a +size 113308931 diff --git a/4b284b28bc4seed3/global_step80108/layer_11-model_00-model_states.pt b/4b284b28bc4seed3/global_step80108/layer_11-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6b36fb7da59bb4f5170d0be4ab25ea91edfcd4f9 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/layer_11-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da7862849b486540303014efaf3b646125aee5cfda2cb3d8f17978fbcbf0ad52 +size 113308931 diff --git a/4b284b28bc4seed3/global_step80108/layer_11-model_01-model_states.pt b/4b284b28bc4seed3/global_step80108/layer_11-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b7b5cc4d0e28c4598873f5ebb6a5e0f47030dcf4 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/layer_11-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73ca8d494be55b4d040143c845e33b7ccc04f9de902e3a4c0565f897b0315ad6 +size 113308931 diff --git a/4b284b28bc4seed3/global_step80108/layer_12-model_00-model_states.pt b/4b284b28bc4seed3/global_step80108/layer_12-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..450953cd83afc1f328160eddd1f6212d5368eed7 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/layer_12-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f1098245e99b531230cc14a74e2b2dd894d044ac0130bf8a117a0f89ec4fb8bd +size 113308931 diff --git a/4b284b28bc4seed3/global_step80108/layer_12-model_01-model_states.pt b/4b284b28bc4seed3/global_step80108/layer_12-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..aa7118fed8dfe032960a7ed8f85293bf750741bf --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/layer_12-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c74dd69b5206c78123b9cca7edb5136c856987d58186083cb6f31748fde737a5 +size 113308931 diff --git a/4b284b28bc4seed3/global_step80108/layer_13-model_00-model_states.pt b/4b284b28bc4seed3/global_step80108/layer_13-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fd3bdecfeecc21706518e18cb08699a338dfd24e --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/layer_13-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92665e3e41ea6fcf172eee07843546c1cbf055028775fcb453298c5101e52aab +size 113308931 diff --git a/4b284b28bc4seed3/global_step80108/layer_13-model_01-model_states.pt b/4b284b28bc4seed3/global_step80108/layer_13-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..de195135372786fb8751637fea8d10028ab50c1e --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/layer_13-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0f4fa92dc362e096110a14edbf9044802f0c7f3f49cdd491864a1a14ecfcac1 +size 113308931 diff --git a/4b284b28bc4seed3/global_step80108/layer_14-model_00-model_states.pt b/4b284b28bc4seed3/global_step80108/layer_14-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9f51454800fd80f9e9aac24d11df692d33f7f5a2 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/layer_14-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef431eb1e68eec500a5b7ee276a9232007c1bec5cf3ce47d73111047c4021369 +size 113308931 diff --git a/4b284b28bc4seed3/global_step80108/layer_14-model_01-model_states.pt b/4b284b28bc4seed3/global_step80108/layer_14-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..529ee14a157d246b866257eb7656f5736a9e02dc --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/layer_14-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e1c46cc5334a4299b90ec3d140bad89c56aea51a0f349bd26ff758293653931 +size 113308931 diff --git a/4b284b28bc4seed3/global_step80108/layer_15-model_00-model_states.pt b/4b284b28bc4seed3/global_step80108/layer_15-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e58594e49edbef1bad0fef8b27d14a04ead1b322 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/layer_15-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b5ffd020a00c377f9ea98014ad4483d29f2da80c108ca1d457fe97684e9cd07 +size 113308931 diff --git a/4b284b28bc4seed3/global_step80108/layer_15-model_01-model_states.pt b/4b284b28bc4seed3/global_step80108/layer_15-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2a34ce7b48ffe5e7b5866fdb8f04658079aeb1ab --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/layer_15-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:99dbf79428387f09375c9108c8b75026f6558561a84cd3de7fef81226008d5a4 +size 113308931 diff --git a/4b284b28bc4seed3/global_step80108/layer_16-model_00-model_states.pt b/4b284b28bc4seed3/global_step80108/layer_16-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d35ba9dde5811e4c678586ef16e6edbf16b32575 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/layer_16-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a349152c04927290b6236477fc1a837bc9aa01292d4fd355f1ccd8dc755f6f60 +size 113308931 diff --git a/4b284b28bc4seed3/global_step80108/layer_16-model_01-model_states.pt b/4b284b28bc4seed3/global_step80108/layer_16-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2b2c3da84cd48017038086866debbcd7a73a7c2b --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/layer_16-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e2efe70467498c5402cb2df732abb71d71d63879deb9a4d7ac4f202a8491eba +size 113308931 diff --git a/4b284b28bc4seed3/global_step80108/layer_17-model_00-model_states.pt b/4b284b28bc4seed3/global_step80108/layer_17-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..80141f7ee682f285522713c613918cfea46a5f83 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/layer_17-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c5f62c91f8ad196c950efdb71dddf00553c0ca13efd1b07524bde7f9a2789ec +size 113308931 diff --git a/4b284b28bc4seed3/global_step80108/layer_17-model_01-model_states.pt b/4b284b28bc4seed3/global_step80108/layer_17-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..46d28a55c34378cacd922a508c9f3a6658f59dfb --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/layer_17-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d8db83308cec72d2bf1536149c152fa9f5616efd98a1b979cc52d2188e108c6 +size 113308931 diff --git a/4b284b28bc4seed3/global_step80108/layer_18-model_00-model_states.pt b/4b284b28bc4seed3/global_step80108/layer_18-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a5ea1240634e92c5c0bfd78ae8381d621c83a12d --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/layer_18-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:304193a84b7af51c6403bda7c12146387336a49c6b9e1e058e26be960f5453b0 +size 113308931 diff --git a/4b284b28bc4seed3/global_step80108/layer_18-model_01-model_states.pt b/4b284b28bc4seed3/global_step80108/layer_18-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4c6d86d3ccc47e52bf3dd2357944aaa9c07817cc --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/layer_18-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b191072831914ae20865ec12367798d21b640c00dffeb1e82397461def02c19c +size 113308931 diff --git a/4b284b28bc4seed3/global_step80108/layer_19-model_00-model_states.pt b/4b284b28bc4seed3/global_step80108/layer_19-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..27d166ddbbf736adfb0ee884e1e5371654f15056 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/layer_19-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea2db112334ea857d2a10c421ea4411a1e78e416257cb39796db598d291e2b81 +size 113308931 diff --git a/4b284b28bc4seed3/global_step80108/layer_19-model_01-model_states.pt b/4b284b28bc4seed3/global_step80108/layer_19-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..20f9f64c7181d417c0d680106ee07cc4963435ab --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/layer_19-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e2d190715805b80734678468298f2c659718f41c597b458d612e85fcc179545 +size 113308931 diff --git a/4b284b28bc4seed3/global_step80108/layer_20-model_00-model_states.pt b/4b284b28bc4seed3/global_step80108/layer_20-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..67be4478aa3683a968ef6577815415ebf400a446 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/layer_20-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06d517d9edb8b1cf0db6a8c36055ac7e7d9dc6883dcae2e900690310d0556c89 +size 113308931 diff --git a/4b284b28bc4seed3/global_step80108/layer_20-model_01-model_states.pt b/4b284b28bc4seed3/global_step80108/layer_20-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ccf8752f2a0de9e23912c97292f7e69f4bdc1ccc --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/layer_20-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf2bb601284145ec68d7fee72b485bb833a58ec675afe9dc509df629bbc0d123 +size 113308931 diff --git a/4b284b28bc4seed3/global_step80108/layer_21-model_00-model_states.pt b/4b284b28bc4seed3/global_step80108/layer_21-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..396944ba39ef2b9566ecbda6d498150ee9447112 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/layer_21-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e79ee52bdf0a5b84267626f0b0dc871ba9453507666ffa10830c2f87faebe04 +size 113308931 diff --git a/4b284b28bc4seed3/global_step80108/layer_21-model_01-model_states.pt b/4b284b28bc4seed3/global_step80108/layer_21-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..155ef8d8bdc49fd474cea9a5da05248713694e98 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/layer_21-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04865fb9684fbbcaf1e70a4ee6a795575f26572ce1eb9b840dd7a687b0f7ee3 +size 113308931 diff --git a/4b284b28bc4seed3/global_step80108/layer_22-model_00-model_states.pt b/4b284b28bc4seed3/global_step80108/layer_22-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c5be86e1934cda32ab5957b3c6c597c392022991 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/layer_22-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:875c646b60678e5224ee0b3693b2feb007ac32005413d0423fe3fbba2e1917cb +size 113308931 diff --git a/4b284b28bc4seed3/global_step80108/layer_22-model_01-model_states.pt b/4b284b28bc4seed3/global_step80108/layer_22-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a1dfe632daed97c82cf5b85e7ee8b890ed165842 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/layer_22-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:80686f6f88409dbf154508213a605b02b2c0dd8c252da800cc3685d1f7d3d206 +size 113308931 diff --git a/4b284b28bc4seed3/global_step80108/layer_23-model_00-model_states.pt b/4b284b28bc4seed3/global_step80108/layer_23-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ea8d86acfd03395e33ef92dcc57e36cc506534bc --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/layer_23-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9407b76d3527e0d92eefc9b77b7fef46a88221cb8881ecf6908d68a69db8da1b +size 113308931 diff --git a/4b284b28bc4seed3/global_step80108/layer_23-model_01-model_states.pt b/4b284b28bc4seed3/global_step80108/layer_23-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6fd30610430ef161f24a696b110ea2e9f9ef0f70 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/layer_23-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2287ffe38ed9e6afd8b0281db791a6c6df517d88b7327be5f34cafcf72a8ec77 +size 113308931 diff --git a/4b284b28bc4seed3/global_step80108/layer_24-model_00-model_states.pt b/4b284b28bc4seed3/global_step80108/layer_24-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..30d86d0f9d606f32b4bd389e41b9729df4402899 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/layer_24-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b5213b41f59c08b907845d874ea62613083d85c1274b3fe45432b2fd20741a2e +size 113308931 diff --git a/4b284b28bc4seed3/global_step80108/layer_24-model_01-model_states.pt b/4b284b28bc4seed3/global_step80108/layer_24-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d8b50dd09f54f75ce3714b27c1f106fcd21efd9d --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/layer_24-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:11afa4ba34898f2d06bc03db5b724775b191ed8a023987778469dd3d3d236c08 +size 113308931 diff --git a/4b284b28bc4seed3/global_step80108/layer_25-model_00-model_states.pt b/4b284b28bc4seed3/global_step80108/layer_25-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d4ad5421b14769762cfed8b03e3a4dd720849b4e --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/layer_25-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f8a2130e77aec889ca0bbec23fc7b072e3dafa7d655c6b2a7e8070863851c93 +size 113308931 diff --git a/4b284b28bc4seed3/global_step80108/layer_25-model_01-model_states.pt b/4b284b28bc4seed3/global_step80108/layer_25-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7902284468f5701e66b2edcc8e323f1b6098073f --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/layer_25-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:789f8cd593f11764dcb879a670862a55985e97b3c1a8a5fc2571f796242a744d +size 113308931 diff --git a/4b284b28bc4seed3/global_step80108/layer_26-model_00-model_states.pt b/4b284b28bc4seed3/global_step80108/layer_26-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9a5f4141b5da9927a1ab8492469601946869c463 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/layer_26-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ecd06434a2e91263a244e861aacc36a8bd5ad6ca8717bcf1b2e5ae503d520ca4 +size 113308931 diff --git a/4b284b28bc4seed3/global_step80108/layer_26-model_01-model_states.pt b/4b284b28bc4seed3/global_step80108/layer_26-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d1bfe491d023a4553fde616e250a8df1b4e0e553 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/layer_26-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ede928f1170eb39d34a057c8f47b267732790bee7c70721e245b5050b4a08baf +size 113308931 diff --git a/4b284b28bc4seed3/global_step80108/layer_27-model_00-model_states.pt b/4b284b28bc4seed3/global_step80108/layer_27-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..df6561ea04ad70a1a13bd21abb0afa1695093f2d --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/layer_27-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:941a076bb19782d629894b1006d8be336e3b265275cea8af34e213a4754ffd1f +size 113308931 diff --git a/4b284b28bc4seed3/global_step80108/layer_27-model_01-model_states.pt b/4b284b28bc4seed3/global_step80108/layer_27-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..50e43ce1806bc54ac8d89487900f0cd1b8f4996b --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/layer_27-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1215dfd70e7e85cd3597914b360b7d7605e63f92b77b567c57568d8f6754a4e7 +size 113308931 diff --git a/4b284b28bc4seed3/global_step80108/layer_28-model_00-model_states.pt b/4b284b28bc4seed3/global_step80108/layer_28-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7fc9f25645da391453b4962ea76b53aaa7e8c9af --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/layer_28-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:17ea5df8a1ed3cfb420b5a2aa900da04152e4b510afec082bccc8b1f0859884f +size 113308931 diff --git a/4b284b28bc4seed3/global_step80108/layer_28-model_01-model_states.pt b/4b284b28bc4seed3/global_step80108/layer_28-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..af248293b6eab6a54704785842f1266194a0d88e --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/layer_28-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:571b358db3db294731f349ce2ac9c3fbd631b65ff45186fd38d08595559f450c +size 113308931 diff --git a/4b284b28bc4seed3/global_step80108/layer_29-model_00-model_states.pt b/4b284b28bc4seed3/global_step80108/layer_29-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c2ff0d867502ba5a301635e2a4c0c9982e26efb7 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/layer_29-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7664dc868dabbc54ab4cf78c7b85e08d18af1e5cafa2af220dd5795089ba15c6 +size 113308931 diff --git a/4b284b28bc4seed3/global_step80108/layer_29-model_01-model_states.pt b/4b284b28bc4seed3/global_step80108/layer_29-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5fd57662d7e95f5b5fcfbf7783f30de6dd6e7845 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/layer_29-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5e3891cebccf7b1ebdadfea969cc605918ada48a619e931f2ad6b322ad38dfd +size 113308931 diff --git a/4b284b28bc4seed3/global_step80108/layer_30-model_00-model_states.pt b/4b284b28bc4seed3/global_step80108/layer_30-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e4760fdc1be130ee4aa5e3311e513ede0ff4d952 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/layer_30-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a1da5b7e365a56ddee70e25b3ead69e84203312d3705a7c88e79b3c2c9097607 +size 113308931 diff --git a/4b284b28bc4seed3/global_step80108/layer_30-model_01-model_states.pt b/4b284b28bc4seed3/global_step80108/layer_30-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a547431ce9afe8c8e57fd186e9387e3891e0aa68 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/layer_30-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b659b5c2631124ba524b7e5d42159a245588d155f0426bacdc08e3b36a96600 +size 113308931 diff --git a/4b284b28bc4seed3/global_step80108/layer_31-model_00-model_states.pt b/4b284b28bc4seed3/global_step80108/layer_31-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bc90c77f937d23188279ad6530b2aee82da6df82 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/layer_31-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:853b9378b9c6bbd261d436a51e58d6ba1b2df27d40da91cc739b4f291c5863d9 +size 113308931 diff --git a/4b284b28bc4seed3/global_step80108/layer_31-model_01-model_states.pt b/4b284b28bc4seed3/global_step80108/layer_31-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dcd8ed98fea8de9b35a3ae509e6121a241a151de --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/layer_31-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:517f0cc951606daa3c64ca9052771cb6f931ae5dd669608375eac66fab4efbcf +size 113308931 diff --git a/4b284b28bc4seed3/global_step80108/layer_32-model_00-model_states.pt b/4b284b28bc4seed3/global_step80108/layer_32-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..70c9a35d59357d41986a3a89204fa51248481408 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/layer_32-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:499fc114fd642bb0b1144201217b8c33713c58d5a302b2af192a3fd9b8205c71 +size 113308931 diff --git a/4b284b28bc4seed3/global_step80108/layer_32-model_01-model_states.pt b/4b284b28bc4seed3/global_step80108/layer_32-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..87ac2a96a4bcba36100fab69fe8b0c167ba32012 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/layer_32-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a2b2e94db21b024b8a00bccf0ab4418f734245fd81c0fcca1fe06e34863f2972 +size 113308931 diff --git a/4b284b28bc4seed3/global_step80108/layer_33-model_00-model_states.pt b/4b284b28bc4seed3/global_step80108/layer_33-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e42774ad3c66ca47a4990bfbaff76580748a2db1 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/layer_33-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:26b3f091f8349d4d1014c26d2753aecf3a49d65f2a1a9caa709e1110d499bd11 +size 113308931 diff --git a/4b284b28bc4seed3/global_step80108/layer_33-model_01-model_states.pt b/4b284b28bc4seed3/global_step80108/layer_33-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9f1f91f977dcfb72413d6db4c9babbbb27114cb5 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/layer_33-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0355c54515124b5c5d4d64f3416fe912fa2e45eb881e98297bb1f1ad8992b44e +size 113308931 diff --git a/4b284b28bc4seed3/global_step80108/layer_34-model_00-model_states.pt b/4b284b28bc4seed3/global_step80108/layer_34-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e968233235736f976719add0aa19025f0bc608ab --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/layer_34-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bef1f85a6cb875a4b26ff4607aa8667f2a50ddbe8febf33733ba7cede478e100 +size 113308931 diff --git a/4b284b28bc4seed3/global_step80108/layer_34-model_01-model_states.pt b/4b284b28bc4seed3/global_step80108/layer_34-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7e7ccea1dd6af626dd3651efd676a232dc7500f8 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/layer_34-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20bece609990fb19272d778fc3a2551cdc8c9a061ec6073f533419a6b4166e1c +size 113308931 diff --git a/4b284b28bc4seed3/global_step80108/layer_35-model_00-model_states.pt b/4b284b28bc4seed3/global_step80108/layer_35-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..749643ae51ff70fb7963ed503b4b8a2e98b21022 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/layer_35-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:01e542c45132770bfafdaf698acce2ff4e370c572c1bbad7af79c446b215299d +size 113308931 diff --git a/4b284b28bc4seed3/global_step80108/layer_35-model_01-model_states.pt b/4b284b28bc4seed3/global_step80108/layer_35-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..efe7df75b360238cac8c2e17f75f24077c483539 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/layer_35-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b522127c1e314e6cdc484724f98aa200a3f3ec97cf5db2e69de2a4c5f722fc69 +size 113308931 diff --git a/4b284b28bc4seed3/global_step80108/layer_36-model_00-model_states.pt b/4b284b28bc4seed3/global_step80108/layer_36-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..251935c4b75f525e55be22f5dda578bfafe612f0 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/layer_36-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9a3d71ba69e0b9d30feb68a08e3a8280f6d1a45b7f0799b30cf8de6d70e929c +size 113308931 diff --git a/4b284b28bc4seed3/global_step80108/layer_36-model_01-model_states.pt b/4b284b28bc4seed3/global_step80108/layer_36-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7377dfb3d2fcec294207134d7a6b5a6e026f087b --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/layer_36-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22dbe9020e4c28bf680eb2221ade38fc2c4ef8926d27f2cda743b16916267c3e +size 113308931 diff --git a/4b284b28bc4seed3/global_step80108/layer_37-model_00-model_states.pt b/4b284b28bc4seed3/global_step80108/layer_37-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b9519d70e3c5d367e9fdcfdf3e30926719e008f9 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/layer_37-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b5b6eca87c91cea4fdfca88447aec15ce607195b23aecca16a857f6373cd77b +size 113308931 diff --git a/4b284b28bc4seed3/global_step80108/layer_37-model_01-model_states.pt b/4b284b28bc4seed3/global_step80108/layer_37-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5e70d575f1c6f64bc500f4d73c4a092696463b16 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/layer_37-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7912dd4eb75d032040cad9b618b8b869ce5dba46b774c3d6be223694a13a92b8 +size 113308931 diff --git a/4b284b28bc4seed3/global_step80108/layer_38-model_00-model_states.pt b/4b284b28bc4seed3/global_step80108/layer_38-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c8298c5172aa815ae32a42173d721786bbd98297 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/layer_38-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:589bdb929eccc59e87fa0e8228043b26c6b49831761503895e0d3401d0cb347c +size 113308931 diff --git a/4b284b28bc4seed3/global_step80108/layer_38-model_01-model_states.pt b/4b284b28bc4seed3/global_step80108/layer_38-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3dc0ae0274537fa324d8cb6120764e95bec9384c --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/layer_38-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ebba4a98e7ba8f15885235cbe5b61ca549c6f92d6c87f79e0cf7f386ee404bb1 +size 113308931 diff --git a/4b284b28bc4seed3/global_step80108/layer_40-model_00-model_states.pt b/4b284b28bc4seed3/global_step80108/layer_40-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..441528fe80941f5745d82d65627ca1f288578933 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/layer_40-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d168c8460d9d56a6e438d03507286df5823221d27db166e6ec02d8d39a0c418 +size 13507 diff --git a/4b284b28bc4seed3/global_step80108/layer_40-model_01-model_states.pt b/4b284b28bc4seed3/global_step80108/layer_40-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a783fc020d2ed5710fac1a9f1765c1e0dded2504 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/layer_40-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:589bd251519ba7b5a557b25832af1da268f96c04c12a94e8ffd266159a1f012c +size 13507 diff --git a/4b284b28bc4seed3/global_step80108/mp_rank_00_model_states.pt b/4b284b28bc4seed3/global_step80108/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5a12bd5e5738573655bd10d400db86d349720bae --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e55d38dc23f9877ed4f01f7b39b5d0c629112e2371174ba762c3669ed68aa32 +size 51507 diff --git a/4b284b28bc4seed3/global_step80108/mp_rank_01_model_states.pt b/4b284b28bc4seed3/global_step80108/mp_rank_01_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..386632da213108c48dfefad4ffed95ff6fb23d27 --- /dev/null +++ b/4b284b28bc4seed3/global_step80108/mp_rank_01_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:13ece52fc8fa668702d6b1c8649d8c32c7dc089792085c616fc7e039c0548c7a +size 51507 diff --git a/4b284b28bc4seed4/evaluation/generation/agg.4b284b28bc4seed4_GEM-web_nlg_en_PALM_prompt_0.json b/4b284b28bc4seed4/evaluation/generation/agg.4b284b28bc4seed4_GEM-web_nlg_en_PALM_prompt_0.json new file mode 100644 index 0000000000000000000000000000000000000000..65b0480d262e71e4a03d9e8df8627e3c73841520 --- /dev/null +++ b/4b284b28bc4seed4/evaluation/generation/agg.4b284b28bc4seed4_GEM-web_nlg_en_PALM_prompt_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.31620109957758985, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.0436977639970438}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.06769961049671226, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0014408731719188182}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.2867407372924206, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004571157006568459}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.10315902016726786, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0019060070438482958}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.031623473816054536, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0008563816673904925}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.14002477235273347, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0030829927271468455}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.048680633498613235, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0012001070226091816}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.06551735699492812, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.001360472354290908}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.27974078406805947, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004483148560424672}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.10001471836261917, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0018101971022073298}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.06504923908690437, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0013793228194582826}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.2754429077514643, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.00433299850418606}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.09908745681833024, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.001816434962081851}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b28bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b28bc4seed4/evaluation/generation/agg.4b284b28bc4seed4_GEM-web_nlg_en_PALM_prompt_1.json b/4b284b28bc4seed4/evaluation/generation/agg.4b284b28bc4seed4_GEM-web_nlg_en_PALM_prompt_1.json new file mode 100644 index 0000000000000000000000000000000000000000..c7c15e3f0a6eeef0a616192689f594e3a49fce37 --- /dev/null +++ b/4b284b28bc4seed4/evaluation/generation/agg.4b284b28bc4seed4_GEM-web_nlg_en_PALM_prompt_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.4465798489958593, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.03821208721897477}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.07371823857673165, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0013763349225185478}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.3688809731011637, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.005115562578388885}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.11510221349692805, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0018417715919236185}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.03378602637117124, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.000831107209277974}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.17620010741543168, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0034569647317057232}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.053026565677639095, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0011718066518224836}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.06938216236815531, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0012090035216715325}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.34811809237457786, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004687691743161809}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.10846810658720578, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0016257087585928257}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.07050615181309323, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0012933152319356035}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.3514069079411779, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004710020922149002}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.11005414089372284, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0017281404618979693}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b28bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b28bc4seed4/evaluation/generation/agg.4b284b28bc4seed4_GEM-web_nlg_en_PALM_prompt_2.json b/4b284b28bc4seed4/evaluation/generation/agg.4b284b28bc4seed4_GEM-web_nlg_en_PALM_prompt_2.json new file mode 100644 index 0000000000000000000000000000000000000000..0f00da5e732eb32d92acf7b3e71bb94ea6ebf715 --- /dev/null +++ b/4b284b28bc4seed4/evaluation/generation/agg.4b284b28bc4seed4_GEM-web_nlg_en_PALM_prompt_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.49390694019851883, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.03283528773113811}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.07053978792457792, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0012141148921630063}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.3722085841928087, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004932224410126405}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.11167166378709677, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0016694573474676788}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.031882639973859254, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0007440437082987532}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.179162100861545, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0036067927027667616}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.05071036081345163, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0010731951740562927}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.0662695912572972, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.001111137879131896}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.34634376427492525, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004426222539040666}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.10482960375745125, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0015367324295981716}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.06731544242555773, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0011479427958618216}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.35393011607524494, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004611169262021209}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.10651850585213189, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0015844678024154568}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b28bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b28bc4seed4/evaluation/generation/agg.4b284b28bc4seed4_GEM-wiki_lingua_en_tldr_en_0.json b/4b284b28bc4seed4/evaluation/generation/agg.4b284b28bc4seed4_GEM-wiki_lingua_en_tldr_en_0.json new file mode 100644 index 0000000000000000000000000000000000000000..3f1902332291698669ac384a6e200281e1f5a70b --- /dev/null +++ b/4b284b28bc4seed4/evaluation/generation/agg.4b284b28bc4seed4_GEM-wiki_lingua_en_tldr_en_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.146341713551491, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.001907488992714226}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.24303710279927596, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0026740629162863815}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.16981770764951246, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0018844380426673607}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.030255907844947725, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0007661823292966557}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.0524686714748099, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0013880458970171093}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.03548853418089557, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0008596537307285957}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.11563887486905755, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.001369806180194911}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.1990169050957429, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.00219255306093255}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.1358656284421895, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.001389903118786626}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.13357747346540397, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0017299539524552423}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.22314380798385272, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0024794181108329524}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.15524577102172657, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0017126012169208825}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 1.60885283648322, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.046404803775343256}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b28bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b28bc4seed4/evaluation/generation/agg.4b284b28bc4seed4_GEM-wiki_lingua_en_tldr_en_1.json b/4b284b28bc4seed4/evaluation/generation/agg.4b284b28bc4seed4_GEM-wiki_lingua_en_tldr_en_1.json new file mode 100644 index 0000000000000000000000000000000000000000..8dc78488dc74ef9648f9654198620e381f8c33b8 --- /dev/null +++ b/4b284b28bc4seed4/evaluation/generation/agg.4b284b28bc4seed4_GEM-wiki_lingua_en_tldr_en_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.19152350230841855, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0023810619465519586}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.302694565096085, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002871626633712586}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.21273278313561203, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002011144383038581}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.04768841739901736, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0012211060679656308}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.07569607558899676, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0016977441994545117}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.05180034750467234, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0010557187582866223}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.13653437043291017, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.001724532681214248}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.22191488232376044, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0022628821878105465}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.15200924118476186, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0013679053352126194}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.17974451166450459, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0022478628561453545}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.28504093466511404, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0027223245492742462}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.19969478957091424, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0018860691826304264}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 2.725412897374069, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.06590713364460175}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b28bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b28bc4seed4/evaluation/generation/agg.4b284b28bc4seed4_GEM-wiki_lingua_en_tldr_en_2.json b/4b284b28bc4seed4/evaluation/generation/agg.4b284b28bc4seed4_GEM-wiki_lingua_en_tldr_en_2.json new file mode 100644 index 0000000000000000000000000000000000000000..cefadf6238b0fa8c8e1e780c431ab799d2021d57 --- /dev/null +++ b/4b284b28bc4seed4/evaluation/generation/agg.4b284b28bc4seed4_GEM-wiki_lingua_en_tldr_en_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.21412338509678533, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0028281010919592436}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.30461283300382674, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002825271119088337}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.21977815129794487, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0019325468923461176}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.05888063726692182, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0017538775810198863}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.0782305781107223, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.001697698646970674}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.05616050870223023, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0011252548440132944}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.15547333657821524, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0023132587548469795}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.22142616128174153, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0022228357872264405}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.15708445866755325, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0013652347675896105}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.20218982558840237, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.002724146894044121}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.28724184959573407, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002676027470194893}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.20703520109346182, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0018184636268796823}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 3.0660991212944317, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.10372713065464424}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b28bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b28bc4seed4/evaluation/generation/agg.4b284b28bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_0.json b/4b284b28bc4seed4/evaluation/generation/agg.4b284b28bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_0.json new file mode 100644 index 0000000000000000000000000000000000000000..b86c3081a6eb69c6eb05312f00ea134cc15d6368 --- /dev/null +++ b/4b284b28bc4seed4/evaluation/generation/agg.4b284b28bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 0.9486318659821757, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.046054186708753594}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.05127435604947866, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0010816160215933884}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.09809462257860511, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.001988448826829593}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.06647296884394631, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0013703971424785793}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.009013651576884465, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0003983827007173943}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.017566860336679598, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0007876531254085971}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.011764220975410813, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0005194241761303413}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.050780395408484696, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.001064268150921614}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.09725254219294728, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.001963943905207662}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.06585835855034873, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0013503477728497991}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.04328842801917388, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0008811589017402656}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.083491757226437, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0016470232472348585}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.05626251970787973, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0011217151771389764}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b28bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b28bc4seed4/evaluation/generation/agg.4b284b28bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_1.json b/4b284b28bc4seed4/evaluation/generation/agg.4b284b28bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_1.json new file mode 100644 index 0000000000000000000000000000000000000000..394a25066730c896ce8980a558c7ee61a219a90e --- /dev/null +++ b/4b284b28bc4seed4/evaluation/generation/agg.4b284b28bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 10.736417414826192, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.12883315690574576}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.4994281816248813, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.00315562260432105}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.4074682552684028, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0028860632451414964}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.42347669756200107, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002299761985015768}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.22810495987567186, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0024574603360052174}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.1831102494700893, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002053236226953995}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.19063915520224362, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.001908484563894186}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.3668088539701383, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0027243573366763025}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.29737795551223317, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0023390292209083986}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.30934327771314435, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0019536593166029873}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.41086699735293175, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.00298010231762013}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.33421135617493986, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0026325643111599697}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.34772596056303123, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0022228086994649674}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b28bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b28bc4seed4/evaluation/generation/agg.4b284b28bc4seed4_gem_xsum_article_DOC_summary_0.json b/4b284b28bc4seed4/evaluation/generation/agg.4b284b28bc4seed4_gem_xsum_article_DOC_summary_0.json new file mode 100644 index 0000000000000000000000000000000000000000..148c74616d106b8a750b3e63d6af2e02c649bafa --- /dev/null +++ b/4b284b28bc4seed4/evaluation/generation/agg.4b284b28bc4seed4_gem_xsum_article_DOC_summary_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.1690176511800054, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0025057503766924764}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.3169600025152783, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004390086610875057}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.20850602933405124, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0025783509188228872}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.035231821829655605, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0014122236080052043}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.0721669404414664, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0026942676554950196}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.04480106981761703, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0016469393826685948}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.1276621204119681, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0019441096332612402}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.24175632866951158, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0035366671887579804}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.15783763779709026, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0020045338016978164}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.13096994127744102, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.002011329849282318}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.24916483206303525, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.003801039212088291}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.16234750057160516, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0021521921302323334}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 2.022928782196655, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.06323504041482224}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b28bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b28bc4seed4/evaluation/generation/agg.4b284b28bc4seed4_gem_xsum_article_DOC_summary_1.json b/4b284b28bc4seed4/evaluation/generation/agg.4b284b28bc4seed4_gem_xsum_article_DOC_summary_1.json new file mode 100644 index 0000000000000000000000000000000000000000..860dbb293f73f875622f9b9e55c0fdbacc402bb9 --- /dev/null +++ b/4b284b28bc4seed4/evaluation/generation/agg.4b284b28bc4seed4_gem_xsum_article_DOC_summary_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.1208560729467065, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0018331156830519264}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.3011735743290485, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004262574821709688}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.17053066710298548, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.00248505468489638}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.023321914774610174, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0009490899905683155}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.06000231967162931, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002490214577848948}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.033207183560968925, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.001348828018973971}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.09381616328217902, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0013434290825839483}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.23579210005809345, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0033043055105988852}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.13262019002149206, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0018340910251430245}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.09660547186408498, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.001445839504863143}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.24312964604533158, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0035600019821752133}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.13665130703802245, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0019843002642716883}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 1.3013783094677602, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.05323851494545823}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b28bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b28bc4seed4/evaluation/generation/agg.4b284b28bc4seed4_gem_xsum_article_DOC_summary_2.json b/4b284b28bc4seed4/evaluation/generation/agg.4b284b28bc4seed4_gem_xsum_article_DOC_summary_2.json new file mode 100644 index 0000000000000000000000000000000000000000..8e7a72fb30f7bf2970ebc724875eade02a71bee1 --- /dev/null +++ b/4b284b28bc4seed4/evaluation/generation/agg.4b284b28bc4seed4_gem_xsum_article_DOC_summary_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.12496533702098848, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0017902842566202737}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.31218014639465674, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004202785523007602}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.17640095609918918, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0024236476790657165}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.02572420280473422, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0010068612303705702}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.06686357551325348, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002695792942377374}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.036694425298060884, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.001436730910285075}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.09783615822934287, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0013714730714619002}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.2462675293448225, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0033637471659569394}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.13833597033877038, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0018696740518708518}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.0994096762980347, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.001470776129912826}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.25080300299758923, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0036598233956450744}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.14067838491016335, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0020231190670618898}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 1.4610227609434248, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.10327228234775739}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b28bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b28bc4seed4/evaluation/generation/examples.4b284b28bc4seed4_GEM-web_nlg_en_PALM_prompt_0.jsonl b/4b284b28bc4seed4/evaluation/generation/examples.4b284b28bc4seed4_GEM-web_nlg_en_PALM_prompt_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..66cd8c6a7ff4501ecf42bba387b0cc8b96cc529c --- /dev/null +++ b/4b284b28bc4seed4/evaluation/generation/examples.4b284b28bc4seed4_GEM-web_nlg_en_PALM_prompt_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:639ebc132aaa7a4d4e4f2efcb1ab11a2a5ce26d96d9287c2a6ecee4091b4eca3 +size 4113566 diff --git a/4b284b28bc4seed4/evaluation/generation/examples.4b284b28bc4seed4_GEM-web_nlg_en_PALM_prompt_1.jsonl b/4b284b28bc4seed4/evaluation/generation/examples.4b284b28bc4seed4_GEM-web_nlg_en_PALM_prompt_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..11599bd74ca43c87e5b11997740ec41dbd7fb82a --- /dev/null +++ b/4b284b28bc4seed4/evaluation/generation/examples.4b284b28bc4seed4_GEM-web_nlg_en_PALM_prompt_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0eb071a7820a402e77cb334c01bc76df24fbc8499922b5dd306c62840584b0d6 +size 5112331 diff --git a/4b284b28bc4seed4/evaluation/generation/examples.4b284b28bc4seed4_GEM-web_nlg_en_PALM_prompt_2.jsonl b/4b284b28bc4seed4/evaluation/generation/examples.4b284b28bc4seed4_GEM-web_nlg_en_PALM_prompt_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..3ea2699fa8402974bdfce74cf66bd5885746b041 --- /dev/null +++ b/4b284b28bc4seed4/evaluation/generation/examples.4b284b28bc4seed4_GEM-web_nlg_en_PALM_prompt_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae2cff1f94e2a505df930131de0de5e54b0964ca527024e2e9f33ae803b4d068 +size 6038080 diff --git a/4b284b28bc4seed4/evaluation/generation/examples.4b284b28bc4seed4_GEM-wiki_lingua_en_tldr_en_0.jsonl b/4b284b28bc4seed4/evaluation/generation/examples.4b284b28bc4seed4_GEM-wiki_lingua_en_tldr_en_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..9c19afad1404716e45af2d3798bdb444b02e1eb0 --- /dev/null +++ b/4b284b28bc4seed4/evaluation/generation/examples.4b284b28bc4seed4_GEM-wiki_lingua_en_tldr_en_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06d4b54bda6bbdb8c3b70584203627e92c3fdb9f5091219a90c156d88d162f3f +size 7665869 diff --git a/4b284b28bc4seed4/evaluation/generation/examples.4b284b28bc4seed4_GEM-wiki_lingua_en_tldr_en_1.jsonl b/4b284b28bc4seed4/evaluation/generation/examples.4b284b28bc4seed4_GEM-wiki_lingua_en_tldr_en_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..5a08c5a9ee5ee69f950eca05c86243c8a809d39c --- /dev/null +++ b/4b284b28bc4seed4/evaluation/generation/examples.4b284b28bc4seed4_GEM-wiki_lingua_en_tldr_en_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:079240cc4a89c2f62092107df15480da16c668872c3d07ea312db5bd5d048cb1 +size 13293513 diff --git a/4b284b28bc4seed4/evaluation/generation/examples.4b284b28bc4seed4_GEM-wiki_lingua_en_tldr_en_2.jsonl b/4b284b28bc4seed4/evaluation/generation/examples.4b284b28bc4seed4_GEM-wiki_lingua_en_tldr_en_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e0b0ef63d6a8b5068beb534d45ed5c163329dc86 --- /dev/null +++ b/4b284b28bc4seed4/evaluation/generation/examples.4b284b28bc4seed4_GEM-wiki_lingua_en_tldr_en_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:872043556397153a239580ebeb1be89826e99c1bf88350be2c81558c2d35308a +size 18873213 diff --git a/4b284b28bc4seed4/evaluation/generation/examples.4b284b28bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl b/4b284b28bc4seed4/evaluation/generation/examples.4b284b28bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..3f019ba87d24d15dca8bb3cb47e92a282e9be5c2 --- /dev/null +++ b/4b284b28bc4seed4/evaluation/generation/examples.4b284b28bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e80378264edc6c6acbec2f75cea4f2e55559d9bf405ae489fa9774c742057e1 +size 4538303 diff --git a/4b284b28bc4seed4/evaluation/generation/examples.4b284b28bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl b/4b284b28bc4seed4/evaluation/generation/examples.4b284b28bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..eda43db1d3c2006978231f945e7b5511cea60ddc --- /dev/null +++ b/4b284b28bc4seed4/evaluation/generation/examples.4b284b28bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b31ad8738924569dd4ae7141bb23f6a07573eda9500b2cba7281aed7ec34706f +size 5046307 diff --git a/4b284b28bc4seed4/evaluation/generation/examples.4b284b28bc4seed4_gem_xsum_article_DOC_summary_0.jsonl b/4b284b28bc4seed4/evaluation/generation/examples.4b284b28bc4seed4_gem_xsum_article_DOC_summary_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..2f7b25611a4cdae3db4216ebc23865e7db0d5a98 --- /dev/null +++ b/4b284b28bc4seed4/evaluation/generation/examples.4b284b28bc4seed4_gem_xsum_article_DOC_summary_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:219feea60cae2c538a4c30c2dbf7695b86f1ebf50bd9550bef2d15a10b2abff9 +size 2776844 diff --git a/4b284b28bc4seed4/evaluation/generation/examples.4b284b28bc4seed4_gem_xsum_article_DOC_summary_1.jsonl b/4b284b28bc4seed4/evaluation/generation/examples.4b284b28bc4seed4_gem_xsum_article_DOC_summary_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..30b74e3208d2339a1e5b566f628a5ca6f4905a7b --- /dev/null +++ b/4b284b28bc4seed4/evaluation/generation/examples.4b284b28bc4seed4_gem_xsum_article_DOC_summary_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:30b3c67cc67031c709cf8831db22e60408d1ea8de3b344747146918c5e5b949e +size 5106634 diff --git a/4b284b28bc4seed4/evaluation/generation/examples.4b284b28bc4seed4_gem_xsum_article_DOC_summary_2.jsonl b/4b284b28bc4seed4/evaluation/generation/examples.4b284b28bc4seed4_gem_xsum_article_DOC_summary_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..1f164539b5f983c8deeb32c0ec68aa73ffc92a50 --- /dev/null +++ b/4b284b28bc4seed4/evaluation/generation/examples.4b284b28bc4seed4_gem_xsum_article_DOC_summary_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:03c6e010b7245f6338e9afb02f7bd349ed46707f2efb3c64276a5397906317eb +size 7378313 diff --git a/4b284b28bc4seed4/evaluation/generation/slim.4b284b28bc4seed4_GEM-web_nlg_en_PALM_prompt_0.json b/4b284b28bc4seed4/evaluation/generation/slim.4b284b28bc4seed4_GEM-web_nlg_en_PALM_prompt_0.json new file mode 100644 index 0000000000000000000000000000000000000000..f7e86e3e3191155bc81e7342c26de925b0b82f4f --- /dev/null +++ b/4b284b28bc4seed4/evaluation/generation/slim.4b284b28bc4seed4_GEM-web_nlg_en_PALM_prompt_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.31620109957758985, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.0436977639970438 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.06769961049671226, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0014408731719188182 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.2867407372924206, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.004571157006568459 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.10315902016726786, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0019060070438482958 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.031623473816054536, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0008563816673904925 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.14002477235273347, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0030829927271468455 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.048680633498613235, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0012001070226091816 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.06551735699492812, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.001360472354290908 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.27974078406805947, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004483148560424672 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.10001471836261917, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0018101971022073298 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.06504923908690437, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0013793228194582826 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.2754429077514643, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.00433299850418606 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.09908745681833024, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.001816434962081851 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b28bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b28bc4seed4/evaluation/generation/slim.4b284b28bc4seed4_GEM-web_nlg_en_PALM_prompt_1.json b/4b284b28bc4seed4/evaluation/generation/slim.4b284b28bc4seed4_GEM-web_nlg_en_PALM_prompt_1.json new file mode 100644 index 0000000000000000000000000000000000000000..ae48baa85075fad8ed1e0f27a986d765e48c2abb --- /dev/null +++ b/4b284b28bc4seed4/evaluation/generation/slim.4b284b28bc4seed4_GEM-web_nlg_en_PALM_prompt_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.4465798489958593, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.03821208721897477 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.07371823857673165, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0013763349225185478 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.3688809731011637, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.005115562578388885 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.11510221349692805, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0018417715919236185 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.03378602637117124, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.000831107209277974 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.17620010741543168, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0034569647317057232 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.053026565677639095, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0011718066518224836 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.06938216236815531, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0012090035216715325 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.34811809237457786, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004687691743161809 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.10846810658720578, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0016257087585928257 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.07050615181309323, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0012933152319356035 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.3514069079411779, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004710020922149002 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.11005414089372284, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0017281404618979693 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b28bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b28bc4seed4/evaluation/generation/slim.4b284b28bc4seed4_GEM-web_nlg_en_PALM_prompt_2.json b/4b284b28bc4seed4/evaluation/generation/slim.4b284b28bc4seed4_GEM-web_nlg_en_PALM_prompt_2.json new file mode 100644 index 0000000000000000000000000000000000000000..72b70f87a7ec102f981798021aff3c61e6ef71ae --- /dev/null +++ b/4b284b28bc4seed4/evaluation/generation/slim.4b284b28bc4seed4_GEM-web_nlg_en_PALM_prompt_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.49390694019851883, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.03283528773113811 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.07053978792457792, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0012141148921630063 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.3722085841928087, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.004932224410126405 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.11167166378709677, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0016694573474676788 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.031882639973859254, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0007440437082987532 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.179162100861545, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0036067927027667616 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.05071036081345163, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0010731951740562927 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.0662695912572972, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.001111137879131896 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.34634376427492525, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004426222539040666 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.10482960375745125, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0015367324295981716 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.06731544242555773, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0011479427958618216 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.35393011607524494, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004611169262021209 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.10651850585213189, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0015844678024154568 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b28bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b28bc4seed4/evaluation/generation/slim.4b284b28bc4seed4_GEM-wiki_lingua_en_tldr_en_0.json b/4b284b28bc4seed4/evaluation/generation/slim.4b284b28bc4seed4_GEM-wiki_lingua_en_tldr_en_0.json new file mode 100644 index 0000000000000000000000000000000000000000..c04900d03268a1dfbe53985cd927c72d6ac60d70 --- /dev/null +++ b/4b284b28bc4seed4/evaluation/generation/slim.4b284b28bc4seed4_GEM-wiki_lingua_en_tldr_en_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.146341713551491, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.001907488992714226 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.24303710279927596, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0026740629162863815 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.16981770764951246, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0018844380426673607 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.030255907844947725, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0007661823292966557 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.0524686714748099, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0013880458970171093 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.03548853418089557, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0008596537307285957 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.11563887486905755, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.001369806180194911 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.1990169050957429, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.00219255306093255 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.1358656284421895, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.001389903118786626 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.13357747346540397, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0017299539524552423 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.22314380798385272, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0024794181108329524 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.15524577102172657, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0017126012169208825 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 1.60885283648322, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.046404803775343256 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b28bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b28bc4seed4/evaluation/generation/slim.4b284b28bc4seed4_GEM-wiki_lingua_en_tldr_en_1.json b/4b284b28bc4seed4/evaluation/generation/slim.4b284b28bc4seed4_GEM-wiki_lingua_en_tldr_en_1.json new file mode 100644 index 0000000000000000000000000000000000000000..883fe21239254724134b9bb927471ca372613455 --- /dev/null +++ b/4b284b28bc4seed4/evaluation/generation/slim.4b284b28bc4seed4_GEM-wiki_lingua_en_tldr_en_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.19152350230841855, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0023810619465519586 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.302694565096085, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.002871626633712586 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.21273278313561203, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.002011144383038581 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.04768841739901736, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0012211060679656308 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.07569607558899676, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0016977441994545117 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.05180034750467234, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0010557187582866223 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.13653437043291017, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.001724532681214248 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.22191488232376044, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0022628821878105465 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.15200924118476186, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0013679053352126194 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.17974451166450459, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0022478628561453545 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.28504093466511404, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0027223245492742462 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.19969478957091424, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0018860691826304264 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 2.725412897374069, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.06590713364460175 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b28bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b28bc4seed4/evaluation/generation/slim.4b284b28bc4seed4_GEM-wiki_lingua_en_tldr_en_2.json b/4b284b28bc4seed4/evaluation/generation/slim.4b284b28bc4seed4_GEM-wiki_lingua_en_tldr_en_2.json new file mode 100644 index 0000000000000000000000000000000000000000..81f7843c4bf9fa93b2564189f2003601801a88c4 --- /dev/null +++ b/4b284b28bc4seed4/evaluation/generation/slim.4b284b28bc4seed4_GEM-wiki_lingua_en_tldr_en_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.21412338509678533, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0028281010919592436 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.30461283300382674, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.002825271119088337 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.21977815129794487, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0019325468923461176 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.05888063726692182, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0017538775810198863 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.0782305781107223, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.001697698646970674 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.05616050870223023, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0011252548440132944 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.15547333657821524, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0023132587548469795 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.22142616128174153, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0022228357872264405 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.15708445866755325, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0013652347675896105 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.20218982558840237, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.002724146894044121 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.28724184959573407, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.002676027470194893 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.20703520109346182, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0018184636268796823 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 3.0660991212944317, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.10372713065464424 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b28bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b28bc4seed4/evaluation/generation/slim.4b284b28bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_0.json b/4b284b28bc4seed4/evaluation/generation/slim.4b284b28bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_0.json new file mode 100644 index 0000000000000000000000000000000000000000..158de1429cca9d825691bc663233a18941d73b3d --- /dev/null +++ b/4b284b28bc4seed4/evaluation/generation/slim.4b284b28bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 0.9486318659821757, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.046054186708753594 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.05127435604947866, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0010816160215933884 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.09809462257860511, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.001988448826829593 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.06647296884394631, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0013703971424785793 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.009013651576884465, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0003983827007173943 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.017566860336679598, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0007876531254085971 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.011764220975410813, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0005194241761303413 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.050780395408484696, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.001064268150921614 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.09725254219294728, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.001963943905207662 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.06585835855034873, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0013503477728497991 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.04328842801917388, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0008811589017402656 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.083491757226437, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0016470232472348585 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.05626251970787973, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0011217151771389764 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b28bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b28bc4seed4/evaluation/generation/slim.4b284b28bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_1.json b/4b284b28bc4seed4/evaluation/generation/slim.4b284b28bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_1.json new file mode 100644 index 0000000000000000000000000000000000000000..a491caddfc922d236c9cd5bcd6e42266ab8090e2 --- /dev/null +++ b/4b284b28bc4seed4/evaluation/generation/slim.4b284b28bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 10.736417414826192, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.12883315690574576 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.4994281816248813, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.00315562260432105 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.4074682552684028, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0028860632451414964 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.42347669756200107, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.002299761985015768 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.22810495987567186, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0024574603360052174 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.1831102494700893, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.002053236226953995 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.19063915520224362, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.001908484563894186 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.3668088539701383, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0027243573366763025 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.29737795551223317, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0023390292209083986 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.30934327771314435, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0019536593166029873 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.41086699735293175, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.00298010231762013 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.33421135617493986, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0026325643111599697 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.34772596056303123, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0022228086994649674 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b28bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b28bc4seed4/evaluation/generation/slim.4b284b28bc4seed4_gem_xsum_article_DOC_summary_0.json b/4b284b28bc4seed4/evaluation/generation/slim.4b284b28bc4seed4_gem_xsum_article_DOC_summary_0.json new file mode 100644 index 0000000000000000000000000000000000000000..9031e99f037dc920d194f5f44a7fea6328f647e7 --- /dev/null +++ b/4b284b28bc4seed4/evaluation/generation/slim.4b284b28bc4seed4_gem_xsum_article_DOC_summary_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.1690176511800054, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0025057503766924764 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.3169600025152783, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.004390086610875057 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.20850602933405124, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0025783509188228872 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.035231821829655605, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0014122236080052043 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.0721669404414664, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0026942676554950196 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.04480106981761703, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0016469393826685948 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.1276621204119681, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0019441096332612402 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.24175632866951158, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0035366671887579804 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.15783763779709026, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0020045338016978164 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.13096994127744102, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.002011329849282318 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.24916483206303525, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.003801039212088291 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.16234750057160516, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0021521921302323334 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 2.022928782196655, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.06323504041482224 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b28bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b28bc4seed4/evaluation/generation/slim.4b284b28bc4seed4_gem_xsum_article_DOC_summary_1.json b/4b284b28bc4seed4/evaluation/generation/slim.4b284b28bc4seed4_gem_xsum_article_DOC_summary_1.json new file mode 100644 index 0000000000000000000000000000000000000000..2fe33328a44c3f12e3593f0ea76a6af5f2fb1c14 --- /dev/null +++ b/4b284b28bc4seed4/evaluation/generation/slim.4b284b28bc4seed4_gem_xsum_article_DOC_summary_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.1208560729467065, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0018331156830519264 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.3011735743290485, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.004262574821709688 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.17053066710298548, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.00248505468489638 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.023321914774610174, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0009490899905683155 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.06000231967162931, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.002490214577848948 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.033207183560968925, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.001348828018973971 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.09381616328217902, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0013434290825839483 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.23579210005809345, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0033043055105988852 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.13262019002149206, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0018340910251430245 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.09660547186408498, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.001445839504863143 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.24312964604533158, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0035600019821752133 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.13665130703802245, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0019843002642716883 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 1.3013783094677602, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.05323851494545823 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b28bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b28bc4seed4/evaluation/generation/slim.4b284b28bc4seed4_gem_xsum_article_DOC_summary_2.json b/4b284b28bc4seed4/evaluation/generation/slim.4b284b28bc4seed4_gem_xsum_article_DOC_summary_2.json new file mode 100644 index 0000000000000000000000000000000000000000..c212518969cee9eb283ee0778c57a699c5d29390 --- /dev/null +++ b/4b284b28bc4seed4/evaluation/generation/slim.4b284b28bc4seed4_gem_xsum_article_DOC_summary_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.12496533702098848, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0017902842566202737 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.31218014639465674, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.004202785523007602 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.17640095609918918, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0024236476790657165 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.02572420280473422, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0010068612303705702 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.06686357551325348, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.002695792942377374 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.036694425298060884, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.001436730910285075 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.09783615822934287, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0013714730714619002 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.2462675293448225, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0033637471659569394 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.13833597033877038, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0018696740518708518 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.0994096762980347, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.001470776129912826 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.25080300299758923, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0036598233956450744 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.14067838491016335, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0020231190670618898 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 1.4610227609434248, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.10327228234775739 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b28bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b28bc4seed4/evaluation/rankeval/4b284b28bc4seed4_0.json b/4b284b28bc4seed4/evaluation/rankeval/4b284b28bc4seed4_0.json new file mode 100644 index 0000000000000000000000000000000000000000..6129d8090c05dd83c83215a3682e3bd3635f1d28 --- /dev/null +++ b/4b284b28bc4seed4/evaluation/rankeval/4b284b28bc4seed4_0.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.325, + "acc_stderr": 0.014818724459095526 + }, + "anli_r2": { + "acc": 0.329, + "acc_stderr": 0.014865395385928367 + }, + "anli_r3": { + "acc": 0.3325, + "acc_stderr": 0.013605417345710528 + }, + "cb": { + "acc": 0.48214285714285715, + "acc_stderr": 0.0673769750864465, + "f1": 0.3156716417910448 + }, + "copa": { + "acc": 0.77, + "acc_stderr": 0.04229525846816506 + }, + "hellaswag": { + "acc": 0.476000796654053, + "acc_stderr": 0.00498403025050729, + "acc_norm": 0.6229834694284008, + "acc_norm_stderr": 0.004836486437527274 + }, + "rte": { + "acc": 0.555956678700361, + "acc_stderr": 0.029907396333795987 + }, + "winogrande": { + "acc": 0.5880031570639306, + "acc_stderr": 0.013833112857645938 + }, + "storycloze_2016": { + "acc": 0.7172634954569749, + "acc_stderr": 0.01041380648612127 + }, + "boolq": { + "acc": 0.591131498470948, + "acc_stderr": 0.008598573693259113 + }, + "arc_easy": { + "acc": 0.6039562289562289, + "acc_stderr": 0.010035580962097944, + "acc_norm": 0.5429292929292929, + "acc_norm_stderr": 0.01022189756425604 + }, + "arc_challenge": { + "acc": 0.28668941979522183, + "acc_stderr": 0.01321498632927478, + "acc_norm": 0.2986348122866894, + "acc_norm_stderr": 0.01337407861506875 + }, + "sciq": { + "acc": 0.857, + "acc_stderr": 0.01107581480856704, + "acc_norm": 0.764, + "acc_norm_stderr": 0.013434451402438676 + }, + "piqa": { + "acc": 0.749183895538629, + "acc_stderr": 0.010113869547069044, + "acc_norm": 0.7682263329706203, + "acc_norm_stderr": 0.009845143772794046 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b28bc4seed4/evaluation/rankeval/4b284b28bc4seed4_0_lm-eval_global_step80108_2023-02-15-11-04-05_0shots_backup.json b/4b284b28bc4seed4/evaluation/rankeval/4b284b28bc4seed4_0_lm-eval_global_step80108_2023-02-15-11-04-05_0shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..6129d8090c05dd83c83215a3682e3bd3635f1d28 --- /dev/null +++ b/4b284b28bc4seed4/evaluation/rankeval/4b284b28bc4seed4_0_lm-eval_global_step80108_2023-02-15-11-04-05_0shots_backup.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.325, + "acc_stderr": 0.014818724459095526 + }, + "anli_r2": { + "acc": 0.329, + "acc_stderr": 0.014865395385928367 + }, + "anli_r3": { + "acc": 0.3325, + "acc_stderr": 0.013605417345710528 + }, + "cb": { + "acc": 0.48214285714285715, + "acc_stderr": 0.0673769750864465, + "f1": 0.3156716417910448 + }, + "copa": { + "acc": 0.77, + "acc_stderr": 0.04229525846816506 + }, + "hellaswag": { + "acc": 0.476000796654053, + "acc_stderr": 0.00498403025050729, + "acc_norm": 0.6229834694284008, + "acc_norm_stderr": 0.004836486437527274 + }, + "rte": { + "acc": 0.555956678700361, + "acc_stderr": 0.029907396333795987 + }, + "winogrande": { + "acc": 0.5880031570639306, + "acc_stderr": 0.013833112857645938 + }, + "storycloze_2016": { + "acc": 0.7172634954569749, + "acc_stderr": 0.01041380648612127 + }, + "boolq": { + "acc": 0.591131498470948, + "acc_stderr": 0.008598573693259113 + }, + "arc_easy": { + "acc": 0.6039562289562289, + "acc_stderr": 0.010035580962097944, + "acc_norm": 0.5429292929292929, + "acc_norm_stderr": 0.01022189756425604 + }, + "arc_challenge": { + "acc": 0.28668941979522183, + "acc_stderr": 0.01321498632927478, + "acc_norm": 0.2986348122866894, + "acc_norm_stderr": 0.01337407861506875 + }, + "sciq": { + "acc": 0.857, + "acc_stderr": 0.01107581480856704, + "acc_norm": 0.764, + "acc_norm_stderr": 0.013434451402438676 + }, + "piqa": { + "acc": 0.749183895538629, + "acc_stderr": 0.010113869547069044, + "acc_norm": 0.7682263329706203, + "acc_norm_stderr": 0.009845143772794046 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b28bc4seed4/evaluation/rankeval/4b284b28bc4seed4_1.json b/4b284b28bc4seed4/evaluation/rankeval/4b284b28bc4seed4_1.json new file mode 100644 index 0000000000000000000000000000000000000000..ceecf8cb7d5ab2b2b57632a3be821caf84975453 --- /dev/null +++ b/4b284b28bc4seed4/evaluation/rankeval/4b284b28bc4seed4_1.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.328, + "acc_stderr": 0.014853842487270336 + }, + "anli_r2": { + "acc": 0.326, + "acc_stderr": 0.014830507204541028 + }, + "anli_r3": { + "acc": 0.3491666666666667, + "acc_stderr": 0.01376707539507725 + }, + "cb": { + "acc": 0.48214285714285715, + "acc_stderr": 0.06737697508644648, + "f1": 0.3421052631578947 + }, + "copa": { + "acc": 0.8, + "acc_stderr": 0.04020151261036845 + }, + "hellaswag": { + "acc": 0.47470623381796456, + "acc_stderr": 0.004983392650570958, + "acc_norm": 0.6215893248356901, + "acc_norm_stderr": 0.00483999574560232 + }, + "rte": { + "acc": 0.5631768953068592, + "acc_stderr": 0.02985524739031495 + }, + "winogrande": { + "acc": 0.574585635359116, + "acc_stderr": 0.013895257666646382 + }, + "storycloze_2016": { + "acc": 0.7167290219134153, + "acc_stderr": 0.010419760409155363 + }, + "boolq": { + "acc": 0.5935779816513761, + "acc_stderr": 0.008590531708882184 + }, + "arc_easy": { + "acc": 0.6178451178451179, + "acc_stderr": 0.009970747281292436, + "acc_norm": 0.5824915824915825, + "acc_norm_stderr": 0.010119187377776038 + }, + "arc_challenge": { + "acc": 0.29436860068259385, + "acc_stderr": 0.013318528460539422, + "acc_norm": 0.30631399317406144, + "acc_norm_stderr": 0.013470584417276511 + }, + "sciq": { + "acc": 0.902, + "acc_stderr": 0.009406619184621243, + "acc_norm": 0.864, + "acc_norm_stderr": 0.01084535023047299 + }, + "piqa": { + "acc": 0.7513601741022851, + "acc_stderr": 0.010084511234296859, + "acc_norm": 0.7568008705114254, + "acc_norm_stderr": 0.010009611953858914 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b28bc4seed4/evaluation/rankeval/4b284b28bc4seed4_1_lm-eval_global_step80108_2023-02-15-11-04-05_1shots_backup.json b/4b284b28bc4seed4/evaluation/rankeval/4b284b28bc4seed4_1_lm-eval_global_step80108_2023-02-15-11-04-05_1shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..ceecf8cb7d5ab2b2b57632a3be821caf84975453 --- /dev/null +++ b/4b284b28bc4seed4/evaluation/rankeval/4b284b28bc4seed4_1_lm-eval_global_step80108_2023-02-15-11-04-05_1shots_backup.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.328, + "acc_stderr": 0.014853842487270336 + }, + "anli_r2": { + "acc": 0.326, + "acc_stderr": 0.014830507204541028 + }, + "anli_r3": { + "acc": 0.3491666666666667, + "acc_stderr": 0.01376707539507725 + }, + "cb": { + "acc": 0.48214285714285715, + "acc_stderr": 0.06737697508644648, + "f1": 0.3421052631578947 + }, + "copa": { + "acc": 0.8, + "acc_stderr": 0.04020151261036845 + }, + "hellaswag": { + "acc": 0.47470623381796456, + "acc_stderr": 0.004983392650570958, + "acc_norm": 0.6215893248356901, + "acc_norm_stderr": 0.00483999574560232 + }, + "rte": { + "acc": 0.5631768953068592, + "acc_stderr": 0.02985524739031495 + }, + "winogrande": { + "acc": 0.574585635359116, + "acc_stderr": 0.013895257666646382 + }, + "storycloze_2016": { + "acc": 0.7167290219134153, + "acc_stderr": 0.010419760409155363 + }, + "boolq": { + "acc": 0.5935779816513761, + "acc_stderr": 0.008590531708882184 + }, + "arc_easy": { + "acc": 0.6178451178451179, + "acc_stderr": 0.009970747281292436, + "acc_norm": 0.5824915824915825, + "acc_norm_stderr": 0.010119187377776038 + }, + "arc_challenge": { + "acc": 0.29436860068259385, + "acc_stderr": 0.013318528460539422, + "acc_norm": 0.30631399317406144, + "acc_norm_stderr": 0.013470584417276511 + }, + "sciq": { + "acc": 0.902, + "acc_stderr": 0.009406619184621243, + "acc_norm": 0.864, + "acc_norm_stderr": 0.01084535023047299 + }, + "piqa": { + "acc": 0.7513601741022851, + "acc_stderr": 0.010084511234296859, + "acc_norm": 0.7568008705114254, + "acc_norm_stderr": 0.010009611953858914 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b28bc4seed4/evaluation/rankeval/4b284b28bc4seed4_2.json b/4b284b28bc4seed4/evaluation/rankeval/4b284b28bc4seed4_2.json new file mode 100644 index 0000000000000000000000000000000000000000..7493e8b9a808beb1303470e4845a747a7185774c --- /dev/null +++ b/4b284b28bc4seed4/evaluation/rankeval/4b284b28bc4seed4_2.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.322, + "acc_stderr": 0.014782913600996653 + }, + "anli_r2": { + "acc": 0.349, + "acc_stderr": 0.015080663991563098 + }, + "anli_r3": { + "acc": 0.3233333333333333, + "acc_stderr": 0.013508372867300219 + }, + "cb": { + "acc": 0.42857142857142855, + "acc_stderr": 0.06672848092813058, + "f1": 0.2588235294117647 + }, + "copa": { + "acc": 0.82, + "acc_stderr": 0.038612291966536955 + }, + "hellaswag": { + "acc": 0.4731129257120096, + "acc_stderr": 0.004982561815214124, + "acc_norm": 0.6232822146982673, + "acc_norm_stderr": 0.00483572890373141 + }, + "rte": { + "acc": 0.48375451263537905, + "acc_stderr": 0.030080573208738064 + }, + "winogrande": { + "acc": 0.5974743488555643, + "acc_stderr": 0.01378286683170305 + }, + "storycloze_2016": { + "acc": 0.7172634954569749, + "acc_stderr": 0.01041380648612127 + }, + "boolq": { + "acc": 0.6128440366972477, + "acc_stderr": 0.008519429207594416 + }, + "arc_easy": { + "acc": 0.6245791245791246, + "acc_stderr": 0.0099362185271143, + "acc_norm": 0.6052188552188552, + "acc_norm_stderr": 0.01003003893588359 + }, + "arc_challenge": { + "acc": 0.29266211604095566, + "acc_stderr": 0.01329591610361943, + "acc_norm": 0.3302047781569966, + "acc_norm_stderr": 0.013743085603760427 + }, + "sciq": { + "acc": 0.914, + "acc_stderr": 0.008870325962594766, + "acc_norm": 0.889, + "acc_norm_stderr": 0.009938701010583726 + }, + "piqa": { + "acc": 0.7453754080522307, + "acc_stderr": 0.01016443223706049, + "acc_norm": 0.7611534276387377, + "acc_norm_stderr": 0.009948120385337484 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b28bc4seed4/evaluation/rankeval/4b284b28bc4seed4_2_lm-eval_global_step80108_2023-02-15-11-04-05_2shots_backup.json b/4b284b28bc4seed4/evaluation/rankeval/4b284b28bc4seed4_2_lm-eval_global_step80108_2023-02-15-11-04-05_2shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..7493e8b9a808beb1303470e4845a747a7185774c --- /dev/null +++ b/4b284b28bc4seed4/evaluation/rankeval/4b284b28bc4seed4_2_lm-eval_global_step80108_2023-02-15-11-04-05_2shots_backup.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.322, + "acc_stderr": 0.014782913600996653 + }, + "anli_r2": { + "acc": 0.349, + "acc_stderr": 0.015080663991563098 + }, + "anli_r3": { + "acc": 0.3233333333333333, + "acc_stderr": 0.013508372867300219 + }, + "cb": { + "acc": 0.42857142857142855, + "acc_stderr": 0.06672848092813058, + "f1": 0.2588235294117647 + }, + "copa": { + "acc": 0.82, + "acc_stderr": 0.038612291966536955 + }, + "hellaswag": { + "acc": 0.4731129257120096, + "acc_stderr": 0.004982561815214124, + "acc_norm": 0.6232822146982673, + "acc_norm_stderr": 0.00483572890373141 + }, + "rte": { + "acc": 0.48375451263537905, + "acc_stderr": 0.030080573208738064 + }, + "winogrande": { + "acc": 0.5974743488555643, + "acc_stderr": 0.01378286683170305 + }, + "storycloze_2016": { + "acc": 0.7172634954569749, + "acc_stderr": 0.01041380648612127 + }, + "boolq": { + "acc": 0.6128440366972477, + "acc_stderr": 0.008519429207594416 + }, + "arc_easy": { + "acc": 0.6245791245791246, + "acc_stderr": 0.0099362185271143, + "acc_norm": 0.6052188552188552, + "acc_norm_stderr": 0.01003003893588359 + }, + "arc_challenge": { + "acc": 0.29266211604095566, + "acc_stderr": 0.01329591610361943, + "acc_norm": 0.3302047781569966, + "acc_norm_stderr": 0.013743085603760427 + }, + "sciq": { + "acc": 0.914, + "acc_stderr": 0.008870325962594766, + "acc_norm": 0.889, + "acc_norm_stderr": 0.009938701010583726 + }, + "piqa": { + "acc": 0.7453754080522307, + "acc_stderr": 0.01016443223706049, + "acc_norm": 0.7611534276387377, + "acc_norm_stderr": 0.009948120385337484 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b28bc4seed4/evaluation/rankeval/4b284b28bc4seed4_3.json b/4b284b28bc4seed4/evaluation/rankeval/4b284b28bc4seed4_3.json new file mode 100644 index 0000000000000000000000000000000000000000..575fb97b6be3cb2cc1f232f7ec91435a68cdecb7 --- /dev/null +++ b/4b284b28bc4seed4/evaluation/rankeval/4b284b28bc4seed4_3.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.311, + "acc_stderr": 0.014645596385722692 + }, + "anli_r2": { + "acc": 0.356, + "acc_stderr": 0.015149042659306626 + }, + "anli_r3": { + "acc": 0.3425, + "acc_stderr": 0.013704669762934727 + }, + "cb": { + "acc": 0.5535714285714286, + "acc_stderr": 0.06703189227942397, + "f1": 0.49967511371020135 + }, + "copa": { + "acc": 0.79, + "acc_stderr": 0.040936018074033256 + }, + "hellaswag": { + "acc": 0.4714200358494324, + "acc_stderr": 0.004981623292196191, + "acc_norm": 0.6261700856403107, + "acc_norm_stderr": 0.004828305041904401 + }, + "rte": { + "acc": 0.5342960288808665, + "acc_stderr": 0.03002557981936643 + }, + "winogrande": { + "acc": 0.6006314127861089, + "acc_stderr": 0.013764933546717612 + }, + "storycloze_2016": { + "acc": 0.729021913415286, + "acc_stderr": 0.010278188399635043 + }, + "boolq": { + "acc": 0.6103975535168196, + "acc_stderr": 0.008529228894936293 + }, + "arc_easy": { + "acc": 0.6292087542087542, + "acc_stderr": 0.009911292822056921, + "acc_norm": 0.6153198653198653, + "acc_norm_stderr": 0.009983171707008999 + }, + "arc_challenge": { + "acc": 0.2960750853242321, + "acc_stderr": 0.013340916085246258, + "acc_norm": 0.3122866894197952, + "acc_norm_stderr": 0.013542598541688065 + }, + "sciq": { + "acc": 0.911, + "acc_stderr": 0.009008893392651535, + "acc_norm": 0.892, + "acc_norm_stderr": 0.009820001651345693 + }, + "piqa": { + "acc": 0.7578890097932536, + "acc_stderr": 0.009994371269104376, + "acc_norm": 0.764417845484222, + "acc_norm_stderr": 0.009901067586473886 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b28bc4seed4/evaluation/rankeval/4b284b28bc4seed4_3_lm-eval_global_step80108_2023-02-15-11-04-05_3shots_backup.json b/4b284b28bc4seed4/evaluation/rankeval/4b284b28bc4seed4_3_lm-eval_global_step80108_2023-02-15-11-04-05_3shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..575fb97b6be3cb2cc1f232f7ec91435a68cdecb7 --- /dev/null +++ b/4b284b28bc4seed4/evaluation/rankeval/4b284b28bc4seed4_3_lm-eval_global_step80108_2023-02-15-11-04-05_3shots_backup.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.311, + "acc_stderr": 0.014645596385722692 + }, + "anli_r2": { + "acc": 0.356, + "acc_stderr": 0.015149042659306626 + }, + "anli_r3": { + "acc": 0.3425, + "acc_stderr": 0.013704669762934727 + }, + "cb": { + "acc": 0.5535714285714286, + "acc_stderr": 0.06703189227942397, + "f1": 0.49967511371020135 + }, + "copa": { + "acc": 0.79, + "acc_stderr": 0.040936018074033256 + }, + "hellaswag": { + "acc": 0.4714200358494324, + "acc_stderr": 0.004981623292196191, + "acc_norm": 0.6261700856403107, + "acc_norm_stderr": 0.004828305041904401 + }, + "rte": { + "acc": 0.5342960288808665, + "acc_stderr": 0.03002557981936643 + }, + "winogrande": { + "acc": 0.6006314127861089, + "acc_stderr": 0.013764933546717612 + }, + "storycloze_2016": { + "acc": 0.729021913415286, + "acc_stderr": 0.010278188399635043 + }, + "boolq": { + "acc": 0.6103975535168196, + "acc_stderr": 0.008529228894936293 + }, + "arc_easy": { + "acc": 0.6292087542087542, + "acc_stderr": 0.009911292822056921, + "acc_norm": 0.6153198653198653, + "acc_norm_stderr": 0.009983171707008999 + }, + "arc_challenge": { + "acc": 0.2960750853242321, + "acc_stderr": 0.013340916085246258, + "acc_norm": 0.3122866894197952, + "acc_norm_stderr": 0.013542598541688065 + }, + "sciq": { + "acc": 0.911, + "acc_stderr": 0.009008893392651535, + "acc_norm": 0.892, + "acc_norm_stderr": 0.009820001651345693 + }, + "piqa": { + "acc": 0.7578890097932536, + "acc_stderr": 0.009994371269104376, + "acc_norm": 0.764417845484222, + "acc_norm_stderr": 0.009901067586473886 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b28bc4seed4/evaluation/rankeval/4b284b28bc4seed4_4.json b/4b284b28bc4seed4/evaluation/rankeval/4b284b28bc4seed4_4.json new file mode 100644 index 0000000000000000000000000000000000000000..b56dfdf3f1edbfaef8cacb230d1f7fab389105e8 --- /dev/null +++ b/4b284b28bc4seed4/evaluation/rankeval/4b284b28bc4seed4_4.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.344, + "acc_stderr": 0.015029633724408943 + }, + "anli_r2": { + "acc": 0.374, + "acc_stderr": 0.015308767369006356 + }, + "anli_r3": { + "acc": 0.34833333333333333, + "acc_stderr": 0.01375943749887407 + }, + "cb": { + "acc": 0.42857142857142855, + "acc_stderr": 0.06672848092813058, + "f1": 0.19999999999999998 + }, + "copa": { + "acc": 0.77, + "acc_stderr": 0.04229525846816505 + }, + "hellaswag": { + "acc": 0.4715196176060546, + "acc_stderr": 0.004981680090303699, + "acc_norm": 0.6269667396932882, + "acc_norm_stderr": 0.004826224784850446 + }, + "rte": { + "acc": 0.48736462093862815, + "acc_stderr": 0.030086851767188564 + }, + "winogrande": { + "acc": 0.5864246250986582, + "acc_stderr": 0.013840971763195304 + }, + "storycloze_2016": { + "acc": 0.7327632282202031, + "acc_stderr": 0.010233145255103061 + }, + "boolq": { + "acc": 0.6168195718654435, + "acc_stderr": 0.008503021391450788 + }, + "arc_easy": { + "acc": 0.6262626262626263, + "acc_stderr": 0.009927267058259625, + "acc_norm": 0.61489898989899, + "acc_norm_stderr": 0.009985214798737251 + }, + "arc_challenge": { + "acc": 0.302901023890785, + "acc_stderr": 0.013428241573185349, + "acc_norm": 0.3242320819112628, + "acc_norm_stderr": 0.01367881039951882 + }, + "sciq": { + "acc": 0.912, + "acc_stderr": 0.008963053962592078, + "acc_norm": 0.896, + "acc_norm_stderr": 0.009658016218524301 + }, + "piqa": { + "acc": 0.7529923830250272, + "acc_stderr": 0.010062268140772624, + "acc_norm": 0.7616974972796517, + "acc_norm_stderr": 0.009940334245876219 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b28bc4seed4/evaluation/rankeval/4b284b28bc4seed4_4_lm-eval_global_step80108_2023-02-15-11-04-05_4shots_backup.json b/4b284b28bc4seed4/evaluation/rankeval/4b284b28bc4seed4_4_lm-eval_global_step80108_2023-02-15-11-04-05_4shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..b56dfdf3f1edbfaef8cacb230d1f7fab389105e8 --- /dev/null +++ b/4b284b28bc4seed4/evaluation/rankeval/4b284b28bc4seed4_4_lm-eval_global_step80108_2023-02-15-11-04-05_4shots_backup.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.344, + "acc_stderr": 0.015029633724408943 + }, + "anli_r2": { + "acc": 0.374, + "acc_stderr": 0.015308767369006356 + }, + "anli_r3": { + "acc": 0.34833333333333333, + "acc_stderr": 0.01375943749887407 + }, + "cb": { + "acc": 0.42857142857142855, + "acc_stderr": 0.06672848092813058, + "f1": 0.19999999999999998 + }, + "copa": { + "acc": 0.77, + "acc_stderr": 0.04229525846816505 + }, + "hellaswag": { + "acc": 0.4715196176060546, + "acc_stderr": 0.004981680090303699, + "acc_norm": 0.6269667396932882, + "acc_norm_stderr": 0.004826224784850446 + }, + "rte": { + "acc": 0.48736462093862815, + "acc_stderr": 0.030086851767188564 + }, + "winogrande": { + "acc": 0.5864246250986582, + "acc_stderr": 0.013840971763195304 + }, + "storycloze_2016": { + "acc": 0.7327632282202031, + "acc_stderr": 0.010233145255103061 + }, + "boolq": { + "acc": 0.6168195718654435, + "acc_stderr": 0.008503021391450788 + }, + "arc_easy": { + "acc": 0.6262626262626263, + "acc_stderr": 0.009927267058259625, + "acc_norm": 0.61489898989899, + "acc_norm_stderr": 0.009985214798737251 + }, + "arc_challenge": { + "acc": 0.302901023890785, + "acc_stderr": 0.013428241573185349, + "acc_norm": 0.3242320819112628, + "acc_norm_stderr": 0.01367881039951882 + }, + "sciq": { + "acc": 0.912, + "acc_stderr": 0.008963053962592078, + "acc_norm": 0.896, + "acc_norm_stderr": 0.009658016218524301 + }, + "piqa": { + "acc": 0.7529923830250272, + "acc_stderr": 0.010062268140772624, + "acc_norm": 0.7616974972796517, + "acc_norm_stderr": 0.009940334245876219 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b28bc4seed4/evaluation/rankeval/4b284b28bc4seed4_5.json b/4b284b28bc4seed4/evaluation/rankeval/4b284b28bc4seed4_5.json new file mode 100644 index 0000000000000000000000000000000000000000..aadf4bb554b489342b6900d82cac3dd79e44390d --- /dev/null +++ b/4b284b28bc4seed4/evaluation/rankeval/4b284b28bc4seed4_5.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.36, + "acc_stderr": 0.015186527932040126 + }, + "anli_r2": { + "acc": 0.368, + "acc_stderr": 0.015258073561521802 + }, + "anli_r3": { + "acc": 0.335, + "acc_stderr": 0.013630871843821474 + }, + "cb": { + "acc": 0.5, + "acc_stderr": 0.06741998624632421, + "f1": 0.2222222222222222 + }, + "copa": { + "acc": 0.8, + "acc_stderr": 0.040201512610368445 + }, + "hellaswag": { + "acc": 0.4727145986855208, + "acc_stderr": 0.004982346155911132, + "acc_norm": 0.6279625572595101, + "acc_norm_stderr": 0.004823604775015894 + }, + "rte": { + "acc": 0.5342960288808665, + "acc_stderr": 0.030025579819366426 + }, + "winogrande": { + "acc": 0.5895816890292028, + "acc_stderr": 0.01382510712003587 + }, + "storycloze_2016": { + "acc": 0.7220737573490112, + "acc_stderr": 0.010359403651225865 + }, + "boolq": { + "acc": 0.6079510703363914, + "acc_stderr": 0.008538802914911995 + }, + "arc_easy": { + "acc": 0.6233164983164983, + "acc_stderr": 0.009942848077476172, + "acc_norm": 0.6220538720538721, + "acc_norm_stderr": 0.009949405744045481 + }, + "arc_challenge": { + "acc": 0.302901023890785, + "acc_stderr": 0.013428241573185349, + "acc_norm": 0.3199658703071672, + "acc_norm_stderr": 0.013631345807016193 + }, + "sciq": { + "acc": 0.912, + "acc_stderr": 0.008963053962592085, + "acc_norm": 0.905, + "acc_norm_stderr": 0.0092769101031033 + }, + "piqa": { + "acc": 0.749727965179543, + "acc_stderr": 0.01010656188008979, + "acc_norm": 0.7546245919477693, + "acc_norm_stderr": 0.010039831320422384 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b28bc4seed4/evaluation/rankeval/4b284b28bc4seed4_5_lm-eval_global_step80108_2023-02-15-11-04-05_5shots_backup.json b/4b284b28bc4seed4/evaluation/rankeval/4b284b28bc4seed4_5_lm-eval_global_step80108_2023-02-15-11-04-05_5shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..aadf4bb554b489342b6900d82cac3dd79e44390d --- /dev/null +++ b/4b284b28bc4seed4/evaluation/rankeval/4b284b28bc4seed4_5_lm-eval_global_step80108_2023-02-15-11-04-05_5shots_backup.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.36, + "acc_stderr": 0.015186527932040126 + }, + "anli_r2": { + "acc": 0.368, + "acc_stderr": 0.015258073561521802 + }, + "anli_r3": { + "acc": 0.335, + "acc_stderr": 0.013630871843821474 + }, + "cb": { + "acc": 0.5, + "acc_stderr": 0.06741998624632421, + "f1": 0.2222222222222222 + }, + "copa": { + "acc": 0.8, + "acc_stderr": 0.040201512610368445 + }, + "hellaswag": { + "acc": 0.4727145986855208, + "acc_stderr": 0.004982346155911132, + "acc_norm": 0.6279625572595101, + "acc_norm_stderr": 0.004823604775015894 + }, + "rte": { + "acc": 0.5342960288808665, + "acc_stderr": 0.030025579819366426 + }, + "winogrande": { + "acc": 0.5895816890292028, + "acc_stderr": 0.01382510712003587 + }, + "storycloze_2016": { + "acc": 0.7220737573490112, + "acc_stderr": 0.010359403651225865 + }, + "boolq": { + "acc": 0.6079510703363914, + "acc_stderr": 0.008538802914911995 + }, + "arc_easy": { + "acc": 0.6233164983164983, + "acc_stderr": 0.009942848077476172, + "acc_norm": 0.6220538720538721, + "acc_norm_stderr": 0.009949405744045481 + }, + "arc_challenge": { + "acc": 0.302901023890785, + "acc_stderr": 0.013428241573185349, + "acc_norm": 0.3199658703071672, + "acc_norm_stderr": 0.013631345807016193 + }, + "sciq": { + "acc": 0.912, + "acc_stderr": 0.008963053962592085, + "acc_norm": 0.905, + "acc_norm_stderr": 0.0092769101031033 + }, + "piqa": { + "acc": 0.749727965179543, + "acc_stderr": 0.01010656188008979, + "acc_norm": 0.7546245919477693, + "acc_norm_stderr": 0.010039831320422384 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7e87479935c29575a38b1dc69b58b3d09cc9c4bd --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac6ea2661a388771f34e7f01f95a5814c96300fee1d8a48b2d1742ad4aedf822 +size 199058647 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f9bb9e79f8a0a9217fca04b2f3f69686c98369af --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d5791acacb5ca9c4ea1e4f0deaaf11b308f26a572e80e33bd137d4c862ed920f +size 199058647 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0d3010a0bde0c2ddf7583f22d87bd56087a1fc66 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2259ba3c93589d817307c0de28f6580f22d7b8f3833b516b70da9f9f7b0a7de2 +size 199058733 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1cbc1cd26ea957b02007ddfd3e3d0c3fabd55472 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d880e0bd590daa428c4c42137116d9dea1fd95c4324e612c24b32b2caa8e00e0 +size 199058733 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..57e8aabf45bb9de695b01487b5f97abf81ae7f85 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8b4128c2223a0592eb986b679e5e8114b0c4ad2da1c4526bd8ecf5d0d43cee4 +size 199058797 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7db037a8a00331e2b715c786e15f7ecd7ccc43e0 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8484ca568c79664d208e109be934eee2981e4734be31f4c1d1df4fb446fc7ea4 +size 199058797 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..315b315d21704d1fdcfc7fc297fd882b03eb7f88 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:09aa46788f11822144e2124354225a3742c4e675cace775f4e4b393ad62db996 +size 199058733 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..071ee671f35f07340ce66e4a0c1e258064842a9e --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:81f10b452f1586fd0af6c8b739da25451aa0bc58f2397b9ba078d86d22002c04 +size 199058733 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f8afb3ccbfa987c348465dc1cbf51f07545e4e99 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c68d47fe92d5e7f38c00f69b235789d9db1508f42f82a1b4134fcc032d21ed3f +size 199058733 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0dfa989978300c262b26c48431974d8b092b2b16 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:854c418431457ff80d44056b571bde968580254fe1df8080d5bc7c08c171c104 +size 199058733 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..eb3651d339c9826877e2279650ad3e0e8627769a --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:80770735043a1fbf9f25e1f85ba70b25317e85c939971ce44a3b9faa245f6d3a +size 199058797 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e2b2aca78b0ecae43edb8a0170b3584c1a0e303b --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5a5a6a24a707d5621e6a95e32387fd0e732d55e3e9def88fa3355a829b921a8 +size 199058797 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c3275896d45574473952d944a8212dcd5b032072 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:817be724bbd1a26581b8d796f2e7ebb4101b6fd7ead39ffa26c8ea318de6ef92 +size 199058733 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7786560dc0444b660338e54b9d0cf71c59cdb936 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab1c9cdde538c1ba139876a956c34eb27edf905597b2a7d20f5e6dca4e5efbab +size 199058733 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..879c7a94150c036f64f2d6706144a42e405b6770 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:767d4de302f370cec7eaedf0d4d4d9e0ff07db67b86e4ce43a0dc4732681de74 +size 199058669 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e39c0bfcf04c8a5705b670368acad089f5c521ad --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:beadc464b291e61fa87c31cae5e26fa02071806609656f9079e6901768f67f67 +size 199058669 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f21b7e9cd01c9ac6aeb05a6b3a905fbf13f9a542 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:61aea27ee40140bdf95dccf0b7727e2ebfc5e9df5eeb74f6e0a0bff8928b75c4 +size 199058797 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..549a2dfdf9ef75c03a200e646c4feffb321f4dbb --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aee4a24cfb4b422b64eba375c39bf6b910d10c41b9d438f3f37977363c71f10 +size 199058797 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7f1492cb9ea0474cb137bf24ed3406bf13836f5f --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5985b1e107a7517b8eeed53d9b40a11d8c46c91437bcd1b69caa4a6d1cdfbe3d +size 199058733 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..339c5d0ae1a483cf7082ed65f41adc8b4527e2f4 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8bbedfb7edefb01636081fd58e5e8280c56688fe61bd2b5e2d557cbbc9128cb6 +size 199058733 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..29dd4cefadf3233f68737cf5c19c8b3cd015c749 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc5cbaf8504fca406559e10b22282fb733a892d0299a26806bbf7445a5e2fc19 +size 199058733 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8e9c5326b08e4ba576106bf327ded13e672ba644 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:047911e9af97222bc83845ba7a8d923b10989e52d79bdbb5ffd4e1b672592851 +size 199058733 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6ebfe3f5172de5f38246cf4c3751c9b494ce98d4 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:63f6bbfa45eaae16c5e08704db68c2cfaf1e7e91072b976509e1142d7a79442e +size 199058658 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d5ac6dbe7a5fdfcc3623b1f35b1fb5af1cd82f4f --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd0144e4f181cb810abce29279f2415f73c5054bdcfe253913149d197951ac69 +size 199058658 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..183ec99cd70e518e23f492f183d377833afb90ec --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:24f089d472c517cde0c07f73f443435a34efb79ee0efde7e6bfeac231ed51016 +size 199058733 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2c5a22f6f1ed77d82b6a981c404de6bc07089549 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bce826ab2ac24f864a31b4d34690f5dce43d3597175059c2a4c1627bbc5fccf2 +size 199058733 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..416db42c2ce93174352c1a008559f5afbcf5ab4e --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ecd06fdbb2dd56725bf176b6649359b3c80c4227ce9f843b3b5a13d0f52056b6 +size 199058797 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c4fc5f00eac282b7632551cbc1af8c71d8a6b017 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce5c87bee6e3033db9e1096e55c8b1602c1be6bb7537eda276f3b49a1a99aed2 +size 199058797 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bee6d82b5db7dcf68bef2b9c80c62e947d6416c2 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eed87198660ff8c930f986d459416ddc97b2c83bdc5ad22cd0ad16eebb792016 +size 199058605 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..73f1a64d9cf65b357da5e27d9eb08640cc323ed4 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fbb12d969cade86481b0f11b361d58a76da4bbee9129993e0f1234c755ee9be8 +size 199058605 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..349f23f658e1cae2fe26d2dec10ad0c1c83eb00b --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b77539f409c89dec6f7c36d701e1ea99c1f324ead43495b0315f6230cc59a2b +size 199058669 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2c75bb271c7a5565680f475246304058b0a433fa --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:975f6b37ee6a7b6f8953e2dee692e2d94fbcf1c0102cecc1f955ebdf60b28236 +size 199058669 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b9e55a237e6663632ca15667bdaa429bb5b5383a --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c5a7e064a10295b0fd0db2a6810a28722e96368a8d14755b1394ef8bbc5bdb66 +size 199058797 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3f1793741d9bb7e9ace33a7fd454b87e5eed7dd1 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:36517d5d3a09f0da1fec0b3f084ea216c6184855bb751682c027605de968f816 +size 199058797 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..af2d422e8413ea4d42eec38040cfd92e5db4eefc --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:91e3cbd02290ef20e08ccb976784f5f25211e8439f1800bb31cf8b88e806421c +size 199058733 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a2f6279abf35a9e198b147da09f2803c3c91305a --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c1dd02a571b083d5e83a15f35559c531f4e4b25775e3ba4c2de77bd9c5b4303 +size 199058733 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a7c382cd73d3c30be510f293f42abe71ef91d790 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab2fe5146c767e78acbb167724c803b943902e7d76ff9393e5813c8cc2c04e1b +size 199058733 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e72a11270b542e73b02a8b9314a19058546cdf0f --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6eed2da9086b208b7c72479d5ea3f15eef60509c250bccd682d82a3366fbf563 +size 199058733 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..da2f61082ace685602e439b2c15c0233a2dcbc0f --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac8cd691980172107188a16fe8ae393fe0e445b9a17038d4968dc5dc461ef74e +size 199058733 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..af9d7daf18a678b06b64ced3da9d03d9861f4720 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ba3fd00c1fd416664b71f290ae694e601850dc0301c7888cba793fc50e5c205 +size 199058733 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bf73d12ee8b79f43cfce7524c028de651898e3e0 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b823de20b0df4ed278bf995d684ceaaa139b464d440050f4e2fe834b7e94e64b +size 199058797 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..748744c8aee8d2c6296a8351e6c48e209d0bcdf6 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f6166b510538dba42eb6b0f722c640c85ab69739981c6bddfe1a0d558fb0c8e +size 199058797 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0b6c38398ada1436a5e2f6a5695fd17342ed17cf --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31703f1b24e4bc4f17ad97c339867f8d9c9ed1566cece5dcd13a01e653a5702d +size 199058669 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e25c5bf8d5581a7d8395ddc7bea93ec3d163bc44 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8972adca9bbff99a3fbdb2286a53375d0597babec3a4381e4643a0b91eeb8f5e +size 199058669 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b3865d29cece56822b9a0dc838711ed5ed6a6112 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b113ba42b984b350b14db48260194e92fe92769be5820f7abd98470ff7edafc +size 199058850 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5ee8ce2f1027ea825d0b6cff5f5923187c8427e6 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:745c85dbc679d286f2b0ade3025236102e52d979cfe88dc655af5b88fa69045b +size 199058850 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..adb87051b28a0590a69daea1e4eec8d5531325f6 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92148c489f0fb47ef9805ad06b64aff93e409227d7fa87104fb45ffc9e9d4bc2 +size 199058669 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d10df2e02a8cfb3ac5006eae4e9d59c83df12582 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3514f588f3f62176dd3f11a4b038a120246ac0241a20099f285d68030dce32cf +size 199058669 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a150acde7f7e2e1eb90b85c8af87af81c9cdfadc --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2fb2dae208ea25736adc5cfdb91a1c88112a46c9a5590ace460ee873a5e8e9d9 +size 199058797 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ad702d2277660817bc993b1fb87e6b6c56281005 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a7d24b04648b44db734631cd8f03d034bafe0571f5a5a50b18b8dd56d316b0cd +size 199058797 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5b700fdff4c488e8eba6ac74db81268812d9d3c8 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af4a8d209bf259349c59d118b32bd827839bf9ec0ab02c5074cd98d04215e3bf +size 199058733 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e333a23e7c10c25d2521aecdfbfaa03ae3ccb084 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a511109e424752fe770bcbf997fb258ddefd06c31786564e7d71e69fb1e427b +size 199058733 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7581b503181676d405d33aef9f4d76526d030084 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e335bd1d47215e4e1cb3ea028d2df69bd51611122b6726906c6f1febf332021c +size 199058733 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..96e6567ce207f2aa38e4c7c5dbabc9af7bd2fd76 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd7415eefa010e7f4ff934c5935db2cadfb7a7d87ecceb6f2e5444e6f2239f20 +size 199058733 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7de92238d05e0d4554104b178b4b66249683b727 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5bb426910cd1e4011c88009e34b1d30e93d68c4f74f7060c6049ca5551ae0f1d +size 199058669 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7234b1222b935dfac78a7a05bdab66bd81a55820 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:89721e583a8587047873fd6b4adae4b5eb45dad30c9b993e5b8b34220979bbf9 +size 199058669 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..be03710b0836d55dd48009e29ca475b4817b4186 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:26575b7f33f217b943be077d4b253742c8027ef7bb967579e006faeeebccf473 +size 199058925 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ffc58f4deca3f24012f81ca170e89d689fd32e4b --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c1bb6c298924a292484921d0f6c0981508adc6b4ccd67be0682af5de384124b +size 199058925 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..be5abd238b8da20fb3a1090bd39d3e6b24f2fdb9 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c88ab83e5810061a3ee9ef598e1a0978f101baebcb635a2656091f6ae2511088 +size 199058605 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b0627176420fc8d0c8a85c05f8e1e69f8e208e0a --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c64cb59e58d409bf4fc93fcd8e55fa2c5d5920403da2f52a301b37381a3fb961 +size 199058605 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cd2c62f3d819c27fd25f2abe351db08ffb60fc10 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a19444377037a9795eddca6f2acb5a5c9194356689154967e4f396de1d63fa66 +size 199058605 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f6b46ae5b174215fc3290d7e7236d66007fa5c4e --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08688528e0e02dab428ebe1da4e01b4c68e099dcd51c7569ee5bd9731eef7a1c +size 199058605 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..32f525dba72d3d7f8d18ba2ab7d5445401a32d48 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b9223c76d9d91bb880f94a709958824feab9673570f0798265bff0e1b865c1a +size 199058722 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..831e026eb4ec6baa1af48d9eba593037a7878d6d --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b1c823ae9b7389a1d0a12b3854af11fd32278427ed83118432f58efa76546247 +size 199058722 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..488e7fec8f77735628fe846ced3a32ab4a898cc4 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1535df0caf6e4a33cf2cffb64c1c5b639842e4046e2c139d4f6b1dc2abf5fb40 +size 199058658 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..08b5d4834bd9f22fe895fc211989541d0e4e1fa3 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f36880028577dc788a346cca77f66ef808c0d7d6438c4fd9225e91b1b9b76c66 +size 199058658 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c0398c93c59926deafe705d0c3cf19e958bb7c79 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd489a0e23eb9e7f74977dfa35aba9165ab7a11d52b9ebfdff40a59b09db324b +size 199058722 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..37d1ff787e1e81f03b436a6bb2de0c5091bb273a --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d71d2729437cf7eee27f033c6d10b1141ff888a9f3269f274949ecaf31aaa004 +size 199058722 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e004c64e907d27eb9622c3081ea9fcbbebdd25d --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:00225d9d87b81af3d2168ba0f208558aac3a7adb86a0f72d95cb646acf2b0b65 +size 199058658 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..68c7bd86a7e1f2a1aaf20963382ef054233c7a79 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:44fbf9254f474cbceab8707e69d1c950fd9f2ed67528c109c84a162b39c22886 +size 199058658 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0ff1a380d96e66303adcef6975191c5662d3973c --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb6e10aad13df75ced7ad8fd9de22b0b0a47a8f8fc6b68a41baa30057f8afda7 +size 199058786 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1407091bbc278163728228ed1261124179739f3c --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b81619a1633759895ef60211575e613d6620b18a776f8f982018967ae7a452c3 +size 199058786 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..336b77ccc5cd1243139f1c810b4711fd5100587c --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:32eb523df1a2e720b535f0f08d484b69d0b006ab547ed32a83b8697a257448f6 +size 199058658 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ba2bd4041ad07e55633e11f938d5feecb686a260 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d05db1cbaf5b756913f31ac23b94d3675f31f057eb15ed0276abb8b51492ec6 +size 199058658 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c6ea31ed9c832d8c9f0f0b5f4d22ee3bca5e2aa6 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:faadb4755dd4d5c11078701f11b8cb2b026d637831a089909c2496e4a6827b4b +size 199058978 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1bece009dcc8a1518b6336bc21dd1322e62afd07 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c255d273a7b9edba630a1cf45f2f5e0b95fd1f7f845f842de4a47588ef2187ec +size 199058978 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..69cd8b5c67130edc93fe2e387918f432d79153c9 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c5d08c662e332db274f0f148661411cfc0c73f5ff25fbf1a18a16f3bc88d63fe +size 199058658 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b27c78aed5cd14241df5b2f284ba24e82bb8788e --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:96105a0662069f8c42c3f3998ded64d6146be6fdf622370d34b2454b4bd725ab +size 199058658 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e5202460c8f841cdbc5672529c545a1874be59cc --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:447b29df1ac4435cfeef9ece4d2dfa5d03207aaa3bf3f42b9533fb1be55d3dcf +size 199058647 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fb7b0437c235dba86114eb909d2cec035ee31aed --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8404a46ab2e265781b733885993fdaf9f14b88857585e91ab37d53168cde12e +size 199058647 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..99a9022321bfa641414955e9960d3e3412371740 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b608afc1d8a5b55ce9a47c29878efb0935608de32d046fc81949a665ef4a147 +size 199058658 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6257237e154b8309407a284323350f3fd95ec363 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:11f7531dc8b68074084369e17ac2fcc48f06fa1d5de7d425147f942086cc181b +size 199058658 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..37ef26b692d64caa75b0270dbef8e86ddd49c1e4 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:99848aef64c456fe5414988c766fb2ed06c7c0f0266093b6628deb981ef87c7a +size 199058722 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a327d2a3e4fc1d3f4706a6d2d8d7f41f3b0a322b --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2059a0064df999d78ff7bcc5809deba2e5ae4bc4c93a79d007193bb90e5b87f6 +size 199058722 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f216f13f7d8b596d547ee8a2dcff204fd9950178 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a6ee1f96a771165cbc707eba3d22c91b9705680c8c0c057b645897dd442702c +size 199058658 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c75df9df5130032216003ac841421a172bd196b7 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e64fc1c891622640430b0685921e13aed089a1b9636ec6ff6bb3c760af2608e4 +size 199058658 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6c509fce7cb791f21edf02a4112ae0c6acfef75f --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:70e99c614fb9f2460be7dd3a77459d1be1c549a5c6f2f0ebe571dee3d3741f0a +size 199058786 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..03153fbbc526c76d995c3dc6cb348d16a425b169 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a368ba4539ea986f5fa3169db6fef7166df6a5c6da3780d0b99115a2cd588844 +size 199058786 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d0263ee6815518dde969e134dba4085ebd18b106 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:225f5dce58090b24ba7e9ef008213246b1d6031a751a5ae83ec05107dfe2d653 +size 199058722 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..02cabb4fcbc0e2ecacee2de164c682b6abe568be --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bcba51a7da02eacba5c271a30e16017696fba82715eaa0f51d9a70dcf3a3651a +size 199058722 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..893c12bf97ad96437a7ea7fa40c31cae6ac93f65 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2dfcd6245ed5a83aa4967fadb3e6dd28df446ee02572229cf9174ef5e6a2b58e +size 199058850 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4d0afa82eadbd711a571ab00456577e6a3d793a3 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:95b5ded16d28ae0e0c645bdda8daae27dd8e0bad6bc606e7d7b1cab3034e2867 +size 199058850 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..73f0d17529d81027bb23cc70beb3d6957795e68a --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e93a343a1695a37249f48a32fe9b7246db342fc37dec218b33545d7db8404b9 +size 199058722 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8f4adf5441c6d708369156a9e1c7c2836f421650 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5fdd031674412d3652ddef0847bbc6e61ca81efc70b46bcbff237b815179cda9 +size 199058722 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..367db10d1141f73ada2bdecfed76390ddedb7523 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b09bd6e2a350522ed29f618dac9c347e01f87bc1a26d3d134b3bcb3f73c70a5c +size 199058722 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4814ed6851fca8798a7555949bbb9afcd43c89d6 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba06ba43492147341dea062e5c6ac5ed34fc1c27844abef174eb35a4a908c26d +size 199058722 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1f0d65752a188aba273c5dd534bbe3225118c570 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b16d01c09bd2a541d3a6dc10cc82b5dadee6f0212f2f104989564310a9b12ec7 +size 199058594 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1f72cbdd6aa8451d22d6786bd91f31bb2fb241a3 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f87297d0ca183a0b2bc6d2d1dd75cc04018b43ff015c81ea1183eef827ae6ff2 +size 199058594 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..618e61346f4adedff5e4afe1f31af598abfb94cc --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b7dfed9edc67f9ef8609557a094c98be5701230cae577c0eaa0c96928c0e37dd +size 199058786 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c4e91a097aeacc538cb47a2b56678d9bc0c55afb --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ca3c296b42217c62eae848ead3fb2de4f134b25ab19e91115716156b1051474 +size 199058786 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3ca388411290dbcf9c104e165a69b7f483548815 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad99f9c94ec884b6ea507ff2bd73e3b57cc5aebe534601e6ede2f70d662e53a4 +size 199058711 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4c47756e9ddd0a36eeb5ac614468bf4074950aea --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ede22dbf2265a6b69f587100e9d5f5244be6a5428db36fb9e7600d0154abbfdd +size 199058711 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5c5fd32fd677c6a608d3bca10b6c0f49cc214bd7 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af970f8c4c451570f46ddc88f1e8f297889ce4689c9bea04b50bafb65f64bfa4 +size 199058722 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4af80fb6312c9c313a1b99731b2adb2aea0e204a --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e26cdd9f97103e0b7603f01d612a57123d072107d5baa197e2317f2c87b18d6 +size 199058722 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..76cd019b999f61dcb1ca2bf5918bdb9d057375f9 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e38a9c3c010ff35acb78c04151c940deead6e500e28474067ef4293b775477c3 +size 199058722 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0a993a0bb872ebd8636ff7a025dbe29fff79eb5f --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6aa45c3cfe73572569e2e9c2c36361a9d62dbde5394b5757aa5fa4a49d365621 +size 199058722 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fa275af75ec309f8717b7ac9966d4c1cd86c2d2e --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b5a5133ef26f330661790222ee2e0da6b9a8848b294474b252a3bd046f7c5ef +size 199058722 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2e2bb07f4e5cee02d9e390c2413d25858f7e0d35 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:119ac001238a249c90e869b2526ae59678d98ef8ae3651c85a22cf18eb2fa0dd +size 199058722 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a095ca43020d2a2457c45782ff22a7a8d47f8349 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:78fa41c5de0c6f1cc7826591edfd39a7319b71123706690cfab6b78017f5bcc9 +size 199058722 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..990c8fbab5f25fb2132be83084d55ed3288ce6d7 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7edae37023776434cca71a490e1de9c72d4c7372a789a7f71447433f83e042a4 +size 199058722 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b6c7c0e025c5ef6ab704608ee4770c3982d15b9c --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b6acba5a5f1784c2b58df7fa9ed7844a49ebdfff3a3d2dd9540410059fb4a57 +size 199058722 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e0e9d4d193789312e2a1e9dfac7befc4600f5c13 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f5fce27e9630cdf8ff6113d28173b15002c400bd1f30759a322087003504773b +size 199058722 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a8b6013ade2d19564d456a484c0d3bf72f3025e5 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd66031881ae99f98dd7c4c60fa9453b2a0ec02efbd3cda3f0067c9515835112 +size 199058594 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..43472109622b7bc9a1dec131ead6609fb4d08cbb --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b5923c03478829142877fabbbe26a4e51f1ef178cdc5fe17df427f36f867ecfd +size 199058594 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fb2c585e864cc5cd3b46e0aaba689d25cb506f94 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c4312823421e3a7b571464cdacd5fa75c69598d2da1adbb1a599366cca2c3dc6 +size 199058722 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..350381bd5c2e508ee360c1cbbe662dd58dedefd4 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ea90c77680fadfcb629ef6e89d073f6b5b5c0f062162fd924944753c1fe2aa1 +size 199058722 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..363fb17906544f267c2e4dfdb156b1ed542b219b --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d02d29d1b3bad7e2ecfac95535b1557a6fdde53d2d781e9c930553fa56f1f8d +size 199058786 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..60de071f776d4c228ab1b12698d2ae2ce580c246 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:17fce6a4d309b822622deafccbab45a629dd7b541f2faa2b46b37b5ade79e3e1 +size 199058786 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..63c95f99f467bb2bfc9257cf017d9a27f6d8fa5f --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8fbec5c1a47f704760cbfc99c6c98fb2ad38582449164f99cc670a3769d1a80 +size 199058850 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cefb112edc5c030a7858855198c5b5f12f167996 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d3f80a5a3ead9c7da37748cf4af505e26bc4b7c63e448b7f455dda5d8c13cb0 +size 199058850 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..eb5f4f889bb09e7f5fc984f2f92dfaf98729d385 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4859939e6e07ff839ebd74eda0183acb086018a52abda8e02a1b7035bb77bb5a +size 199058658 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..11bf513d1f3379f24507cf1559f9530e041e7c83 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c91424d7bd2ed07ec612e91be517cdc4c966c677c924b92962674cb37cb887b4 +size 199058658 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fd6a33592b243a87898b262912085568164b936f --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:09604eaa70cca68a58fd1e1ad4251c8ae770c2a1b96a8e664d0db9469ef74bd9 +size 199058647 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7cfa4e68d8dcc24d094a176d5b9f68fb284dbfa0 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:453b1f157b5043758f672ae90a0cf706e4cb33d75cf365bb013d4537ea4fa772 +size 199058647 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..825f703884b515382b43dcb4f2fe4a39a0bf6479 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb51dae74e101b0239e6b0287302c7047f53138ad7f0e9f28582fc637c71b0e9 +size 199058722 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..63d846b0be26b8cf92f1a8f66f189b5ec388e373 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0dc89ca53f483711093f5004c61b4c774ba6b98f148acd19a619b866f9e906f1 +size 199058722 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..32c85a7b1a59a07639e875aba75807879ccc7b65 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:04ff3c39494f6c9bfff1909f215848151f64ad4dc5367d81a36c546098983aba +size 199058658 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..41179624737eaef6a806734f92f7bfc0433bedbe --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da4a3084c683cb0b4243511dcd9a6029bfc11c7026c90bda72ce47c00df38eac +size 199058658 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..62bfdbf91add50c9638040b343450755b27d621e --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:26816881e8e4b0aa9292ab97200e975f598cd1b1335cd55a9f9809d01726758c +size 199058658 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..28f64dc8491f1a7d68ba9f53d9fda28f46e8da4d --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6c94d012efb5bf05dea4869b940481fb093ca593df107cbc630c3ad191915b7 +size 199058658 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9ce53fc078a9ebc4bfbe6d35265c8e656c9a890f --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9e65b5eac86b2844caee9ca4c9c16a45e22e3598010017ba9d4c6bbe1d92781 +size 199058722 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..76f466955d671f3d456788341a1688011b678318 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ec5faca2f6f1168d4d7ac7ac4fbea722e28be07755bc5df327a14e1d3820252 +size 199058722 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8729e4db6528226163cac39c1114a1d7a9c39927 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:985e20db4621055d585ed22d154d9ba7ebb84806f4e5ad1e41228fa25342e129 +size 199058850 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c0c9e03a537d593f7e9b8796bcabd16aa111a01b --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5578cfcec3f35b0760746727e6e4e0e65fb7624cd3d31ef5fa78883477df06fe +size 199058850 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4858323a5baa0d930804df12ecf86fb2c28dcd3d --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:65a51fad56ac18df9846276b1ad0ebd406d4298356890a836c4ebacc50f8a29c +size 199058722 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ccaea4e48f88b3866a6ffb5f98d6791640e39838 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:42ba1e3119923c212de10a12f4fd4072af935b076aac9a1ba220df2a8a390086 +size 199058722 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..77a798ac08de10fcdd4f6582403e33f716f2c28c --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:abd94c06606a281ad2c941a1289d5603270b5ef7eb0d02b00e27f6d94739c2d6 +size 199058658 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ba4f9cfa64d7b69e76421ac83a13ed0e76d1e91b --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:65fd87e78de7ba8c46dc38c79a9aa3add2437a20bb58cf2ed42c749012477940 +size 199058658 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..855b0ff1830e02f4e2aaf22c2e955494b7ab55fe --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bda4534456ec9d518a6dc143dbb4f7e0538e07eb68c1926b9e386afb58a14268 +size 199058722 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b7d58906366b77bbc75a0d89bc10dbdf55d59f33 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:306f94a6e573e74cdafb0f318d760a855fb7710abf388b3747308acc3ee6cb44 +size 199058722 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2a38e1f22e06ce23e7914637f4cbb9d24e0aa512 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8996ddfebdf6b0c5da4921f3d7b44f7abc0db5c70865f8f41e50d33c90e66df1 +size 199058658 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b157a3ad850e798b968ec81e244d89bab701d078 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b298d0bc784624186ccfabfdb6fac902f10ac99209fab66e2ca33c0abdfb796 +size 199058658 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..40f93c448cc848a30b0e3825c9910779006e6f1e --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b2c8b771c7396e874675c39ccbb16b680c2984832ee935d95a063dcfbd8f255f +size 199058658 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..25da55177ef1be2787bf37bd9bc704a72a648637 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b8c9a23ee171e09eacbc7fd6f77fa26450b486adcedb05c7f062bd0fc6c08d4 +size 199058658 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e771b45893c10262f1a50860cfca7ae0c74198eb --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:57da5b32b7e937fc85bbb9402865662ab7519b6aab5804f9eaace1c8eea15177 +size 199058775 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7ff3439cc543ef81b61acc83c51c233d59f78a5c --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b3ee802c9e83690ab935deed8b2d159124a73e4731af2d8fe61ae9d365de033 +size 199058775 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..25c9fdcf5ac10b570fa8730ffababce6f9695203 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c05e582f03aa309cfdc1a270647166b4db647f851b9fb1422be7b59dfc6bc59 +size 199058722 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5ed9f32a298170ec51462fb33cf43249017e655b --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c2c45eb6c470c306ef6f7c91d9f5869f4919abfb106157dcbae4dbb169e5af2 +size 199058722 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9d3ddc94b0d908a4190ee902b4999d6845b3a335 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b93bd1b03f9769c7156b995a146957ad74f1a8af3d4a3206f624c4c857c28faf +size 199058850 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7820f89a7c835c9e62cfe42a431859a166304193 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd94a1bb13c8d18ccef856137cfd2de60df01648b44a519bf1f12c6541ecd1ef +size 199058850 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..620bb0810c2b7c57fe3297546cbe7041c1284bdb --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:590f7028cd53babda4dc0fe727f30c707a20fd33b9584099dde611b8c9d535b5 +size 199058722 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8acc66ee72d9e28a8f84a82d0718399ea7a26b6c --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8945dd9ea40558550c5a97564ac9fc048f0c7e6a6572b79e06f18eeafe328d3 +size 199058722 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..91e2efb2f8d72b045ecb879fbf5798ba01b51421 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b29dd1667af2e3c9f7db1e6a88c044f79702aa5ed5cec82983ad725fcfd5531 +size 199058722 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..414d64c90be0ab45b14f630a3f54e23bb031cc1e --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b6fc363cf7c3cb2bdc13bb2fd7847c4e1c79f98dacf51db85becc2bad8eecd2c +size 199058722 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..56db2598ccffab06cee6f605d8cf3f0c92d8b9fe --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5103f98064030d9cd095ba8d7cfda8f17600b7c70f54c064360cf6c27a315f11 +size 199058722 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e7d5761b33b38f657f72d473bfba5a7b95d003b8 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:28354c67b4ac626987c9a94acd69680a2ca6404b48de8e2cf6e624dbf435cb71 +size 199058722 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b53b5df50c2627f790597c3002697aa6276d27da --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd9e3bce74e733748f52dd0b58509433f903f355d45e44b1a1fd4b6786f34c89 +size 199058658 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..da94c79b9466ee0fc8ddb644f61d62194f993f39 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f5e25135ebdaed2b862a1f4b085dd37995c17e1fb44b07afc05fded15f5e53a +size 199058658 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..afd95f094e8931dae75f91cc1b4af0caaf9d0057 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:859528a874502614d1856577bc6e5e93e71fffd553379244e4c389e3152d316e +size 199058722 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..51b3cae282a324db333e60e49fcb2f847aef27cb --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ffdaaa5aae4a48e7a7abc8ca3f8e0440c37bca4e73670fcfeae224af8176cc5d +size 199058722 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..924c6eb71d3342535fb6e6763bce26cd5916146b --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:327bedfff0b4b70351f3cbeb2f88a4bf77add56b7d846708bb46aa1ef61c6d31 +size 199058658 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1f758e9dfe43e949c3b2ccb5b9045d429cd65b9f --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:30985b397036c3b0c1031f2af0433c3ae4c50ead81495c685035187ef5fe2f95 +size 199058658 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..571c9fba9a763e29acc7abb00e3f08218e3087bd --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:04abcefc029d499a666e54e096a74d5b5702d64f790816550b8019d538bd09d4 +size 199058914 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d41871b1c3a16c2fdfa65cf0f70ecefa5b7b5f4c --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c4aed7e5ef19986f1432eab474264c1e05a3d2bac87a5a1f6a8505364ccfa165 +size 199058914 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6b69ddbd20f38c36f6d92333eab32c9fa3ba35c3 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d74ce005ca71b603e3a50da27ab621c900d883eb89fd7e6b90dafac701048bf0 +size 199058658 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3bcb115bb682be7d4b7f0214f6c04844f9ec2369 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a7866ffdea2ec8c3745c5cc2a7b8b45fd06b764c42c3a6759a4f15d5974a09ba +size 199058658 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..29cef26e8aa83b3e73246cb0efb0263af34da6e4 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9b612f98c9b34cc8ac7157ad6dac1b93cf97da80d74c726a8c2faecf0fe5199 +size 199058711 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..15715dfde77b890e4514713467f5b49a83ecbcef --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d6ee529aadfa44d6a06a147188b4846b5adb188fe6be030e6acb4120c580c957 +size 199058711 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2c505c4ae4652470a39291f6870bef5ea7b402a8 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:887895b130ad16898fc52b95f5a53a8cf1371b5520cf8826e7dabaf4d52bb714 +size 199058722 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ff810dd1ae3ecb741f612c1d6699c53f177c7b1e --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc31f078e417162006b22e9a1b2ce39d0fd22367654dbbd0a6434f199bf65bee +size 199058722 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a9ef4567d93aff0779b8a600a77efa567900fc17 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e136b7203d295bac8e9612fa175bc69c36d4fe54e2c604bd1f61b6737dcf2408 +size 199058722 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dd351a0b118fb51fd36d72163aa37c485f26c144 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:590404b645f492120fa1c6c2cda2eda5ebedbb458d1abf8826c32dfa430ac7de +size 199058722 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..373734a69d941986a6442f8c7955adcde64aaac1 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af07d43d5d17516a9f15c8f8a628f548e578064439a98030d7a6d9494d5b5017 +size 199058722 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b58c8f6e8b520ac7d59ef0c5f827130f24f6c986 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bdbba166574dd597cd41d7f6840dea64c97d0949188a6b2a99de32d3d0987384 +size 199058722 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8206cb3393061d81ed54fda14b9a5afa4e81a468 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90bc8730c64aadcc319f41079748c726d406874441f5b83d80ba8404d2a39c9f +size 199058658 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b0d24f7e5d46679628baeaf4ecb78a8f3a09356e --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08dc48b9b9d2b2134e0fd006a3c84c6ed0f6d8c3e71ab04634e4f5df137dd15f +size 199058658 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..17581567040f796c934994f2bf8ee3605960fa7d --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:61b38b906027001356797b5a75a8a503e3ae3fa3ea2ccedbe654b0938571491c +size 199058658 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..70b1bf25b44b50dc39cc4200678733e49760938e --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:18180fbdefd5110d3e8363df7ee7dc754bc55ce9526dbb2ec45f6d8bae462f92 +size 199058658 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3ec0fe0b58055f1a8c21d5afe44ab26e0d4b8ecb --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:abdd4918be80ca9b4459a9688af2cebd409c4e39b09bc0424b29b799fbd60bda +size 199058850 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c1abb905bf7d6e7663bbf0e63aa95727dbe6700d --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8854d20f9d0387d9eecc3d75512e6881560dfb8f4778f2e6710f9c54e980d66 +size 199058850 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9bcdaf77b76d7e2363da317ed9d0461a523766b3 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9347b38fc63398652df5143116421c43c8f6f9ec5abb2f2334acc3e62cb601a6 +size 199058722 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..40e213e67358624b5a64c8f526a474fb6999769b --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b789750b3a6995cd5bf25f0651edcf8cf0c594969c8f8f4e9669e22da44df98 +size 199058722 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a789718efa79936cda78e0ca2078f07f8102ea8e --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:52285a7c8725d9a742efee24ec3cdafd6b63d84fa48aa42536ac92769d692746 +size 199058786 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..237d45f552bcfa10de5ad89dc4be85b1e7c62d21 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f14b80ceb2f24c387a42a152e274a63cb34b6fa3f3b85e9ad9da65cc6f61085 +size 199058786 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fa1e11b736e35aa93643af0b79f38e71ae9b1da7 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c51a7d5b59dda7aabeef56e418db94cfe8f4333d69b0e6fa0cfb3235910c12bc +size 199058658 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6df3294716c48e08609e7b06049c1675b9cc3e12 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7996b9df532b723ba3234aa7c1b4deb9fff29255f425ac1206a7ed095554ee98 +size 199058658 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cac1f9389cc64c2bbef503877ed34df9939cf828 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a91da5a0e9c11857323932ba409cecc7ba901d2e0bb941bafca735c6d740922 +size 199058722 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..233a437a7c4def2c147d5a26f120e32cec742e06 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf30a9d34bc9094f9b1db01f66211fac3f932b3d4721f9f4607ad5a5de3c6ee5 +size 199058722 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2a74ffbe92826214fb0935d1034de6ff1499b725 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3bf4de93f5e80774a49235d38430c82aebfe35e75609862e39003e73a988a0f +size 199058647 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..de0c602379fc8a05723c05fc5eb8497a70967fc4 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:17e1d0e24263a6608c3009c3dfd249982307972eea1242e157170582ad4b34a1 +size 199058647 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b485aae9b9c41eca82b9dd3c109a2a61f3df6093 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f2254d17e73cc0d24dd562184e1ccebfd12b9e90e15aacc0d63f6101994d73c2 +size 199058658 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3d408c3041916ae6ac5d136e13b040a18b38db8c --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c82d1261699548696e9ed818cb732fb4a526f3886082fa4202da8415e5dcafed +size 199058658 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c4cd7e1112f965be30a016df60ff652c25395d32 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:467a3e76756cc13898209a52fb6ee26621100de263e00a2e4214de4103de897e +size 199058722 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1648df9ebb9314d50feaf2259420a3a4cf168bcc --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:971bf42c3fef8c0f63f33f425982e3eea1d6c25f0c35d70192bc52e5f0f83070 +size 199058722 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..73ce9a586ef15c3164a8146daff3473171e254f8 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f39675fd63af85ebe7a28f9b6d28dfd4117c30fdccce8b19ae75465b67271a7 +size 199058786 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4c562dc2e70017d1bbe8ccf29c0eed1b61e20fa5 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c9e5725309c9bef51d13e793bbb2b534df7c0ca5d66a01993946d6004b311fc2 +size 199058786 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..81fc109d97856fcaefd4103b6a08fa579a53f7a1 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a1a282143081d8b4f40e6e833f3c49b729e05f19d12722a356b70a7b28b0b1b +size 199058722 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fc6b60506197a368cb99936b9b90e5e24bf02924 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64e7bbfa555579b44b5a8ab5faeaa51a081029832ee873c7d3eb644fe29171a2 +size 199058722 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..604574d861647351c71aeadbe7b9ccf5a44ed2e6 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f61e0da9063cbbb450c60bad9071f092eb021a85daf5ca7534f5e51f33b7229 +size 199058786 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..329f6213d36cef17680528f50acc6b623c506319 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3fd9a1cf267082520c0525e5e2e19a7b51be1f729e5acc3d3a775aadf25b46f4 +size 199058786 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1b8ed75a47b783bff22dbabdff01237f9e9b561d --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a85334ed72467ede54f8af1e204e9f2187ebb4baadfd716021dc6505489568e0 +size 199058658 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0bc80cead4b4e9bc5f7323a26251a02c8222317f --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:027c55c87425c4436fcb092ec23a4be6ee25cda6baa8964713dedb05b16ec8f7 +size 199058658 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e6a12917af5cc15bd88c204b633abae22685b806 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3512f1e5509a5c43e2d307e5f0866546c019b09c07f8367f0b2f388c70be73d9 +size 199058786 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a130d21a79de767407f9a12d1ea031893de9973c --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:461c3a613c4ed7a043fb95a09c5a6d2c4369b15aee34c8cd531e26bf72e364f9 +size 199058786 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c79d560eb3c6efd208eb48edef613be979f219b1 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:37987ec3a5751bd1b723cefc02d9f6256abd010370baae488d56d240654df7e2 +size 199058658 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d3f50266ad88faed70add483d8a0c32a7dbb6fba --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f642f431a1b266bd710a489ddd2458971215899da509c7b2b9684c4ffbe81d0 +size 199058658 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bfd7cd2e9bd1ae9c52846938d50b3d78f11c7834 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8110efc09aed8e6d0fbba0dba953c1734a28d15fc58f5feb76060357a9b4569e +size 199058786 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cf2f7f8a9a9966b12493e79d6e548073ce3dc1d0 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:667712fd575113471529a8b7ef77142cac550084416bb09f757c045df72bb26a +size 199058786 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2bd7c7eabcc7593ff89096808fdb3449eac32d14 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8fb24eb81266a6511dd03ee91fab2dea5b77c1751f9f244dfc970c1e02ce7be +size 199058786 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2baa5ce62ce605c10e05ce5172f26781470d2f0f --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76e68cf8eeede745af51fa9c55982e76ada25d387e70c88a7222be2b0fc9e098 +size 199058786 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..eb22fe19fe3ef4ac8e86e8913f49a0561f64e27d --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8bb6d1167cd3f5ad91834282f2675c48b59583c608d8f289fc30816384d6be29 +size 199058647 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fd0b52ee7601ff95e523bef33eeae888de262619 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:523e563f10548b5c525053e6944584995d655190c7dba0adcd73fb59acb89984 +size 199058647 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..109f33e7eac6389d8e9e613dd09f3ad1c946476f --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35d1227559edf3fed21723b5a0b63fd748768879a87a4d138d3109330223a77e +size 199058722 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..76be2cdf23b3249c4be2f7b07e036adcc9f17b64 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5739c934aff1a6696298ff7a748822024fc2ede0338f8e4463a96234145d509b +size 199058722 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d7ab6bfd22a963985f58abc7c95ff009cd13cb93 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d003a7ff8adeb78a3b6f5c73de0ab7283a7fa8db62006d7721d9ea36e95220a +size 199058722 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..829d5f87454d0e6c83f040ddde0a8c1b27db4a9d --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:263194b2f87b947c0fafbb53d9afdaff24ac9877f19e8b58fce093141c664844 +size 199058722 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..463c931518e5f7fc9180b9f19e14185332379e20 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d49727a59fcc6f92d4b783b73b70f49584ff494161687326cca25bf6788e4a5 +size 199058658 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b50163dc86246c539f80a43faa2d5d0c9d7d5e56 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e42369209a4bf9663f0bb104e436d92901b57789131855a6f55c22474af6c689 +size 199058658 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6d199e377d2809c7469929ec2e5e122b32de8285 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e13d38615eb33f0b8b1340f6b3958238123d45e14cd46eebaef4426541871b5 +size 199058786 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..706f80f28b5b3a82bc4603124a44720611eb77c8 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c575d55cb082ee5e6399fbba8e92e17e23793ebc8e6bd6bffe2c5324d752915 +size 199058786 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..35366401831a3b1d305899134c010277b931fdc2 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c09110c97213f0aa3408d3adce7fb16c91dc93f2cebf24a98b53b5e5c820e7f2 +size 199058658 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6a9d7b78ddb8e5e7d969c797be3ab5a749599e14 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6a353861a23e11ddf948e62aa8d18c5b1aad06e5a13bbc423d5aa2920077ccf3 +size 199058658 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f2554b15ffafb5a4e1344c7008c72acd26ed8dc3 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a9b7d1dda65ec0d9be0872eab5acd051b9d010f9cb877db05d9ed58382bc79d +size 199058786 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8d5547f75492bc2c74fc848c8dff278e36339081 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc378397f12ba1e64f85c344bde5ace986b0bfe476f49c7bf81c4c8667b803fb +size 199058786 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..29c02a5d6a3470ecc414dfdb15bfc1f4d205a051 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:75fcc8bf5c30b2911a75c103d2d338ff2b41770bec312bf2ff7f8f62a9087eb4 +size 199058786 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dcd10328b74d9ea03c72ce3297b18e99e07d0e3a --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08953db89f3bc260ef42ced50e5b18e268e6161c8824147843dd959158ffddf0 +size 199058786 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c5d4333dacbded9b3fdd4ae51cf304f46baf515c --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2bc46fd52303e057ae4c86ec5d38a312e38a37cf7c28e78d38a1215e6399e17d +size 199058722 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d5b7ce8799b99a876ab031e0a07ed74ebac15a11 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7fc768abb4637a0aa8b1ed4179c9bdccdec09410644e02e7543b27e1b204c205 +size 199058722 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dea4bc3f32223bf9654015b3ee6b2af9a6c81108 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:847fed1ab3511c6a4313c73a033f3f3bdbb8ef88a442cebe34795397eec002a5 +size 199058658 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1f66ed32431a1fb1e3889ca2963527af5545a753 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b82b0a8dbd70fe6b4e1ef425381b03cc8b31d34fcd0acd048dd8703207c5efd +size 199058658 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..be9d67af8c8df6658b07440f2e9c405038e0f33d --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a57f6a7ab49e522fd54090b14b9b93f8ace467bf944d64eb7c2edc6a01abf2b4 +size 199058658 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9ef0935db8c5a941aca57e3d66e23d24d11f9d9a --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3035d8b994abda97d7d72b0affcff3754b66345d93d9ec7dc7640a890d0ef731 +size 199058658 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9355ffa60808b3e54f5ab8ad85b30f8c540069a3 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dfdb1eabcfdbb99d2ec7c39b7790d4121ef4854e7f732cf37262c236dcf359f3 +size 199058647 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e4064819176947dfc3929b2a06f4ef56fe2c52a6 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a08379768a75efac766a22fbe1a4c9ebea324afa58f85c8322ccb224a76438b2 +size 199058647 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..80231723408d3427a7e34535f9b17178e08407ee --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:13b8fac7ff4159c0f2642697b9f2c9497e583f8233f05a2854a01f511b07c669 +size 199058850 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4cc2a43a0430bbc88a62869edc144ec00d141876 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c911ce97797004d20beb1f81a285237f4019e3f5934c6750e95b62c7ba0aeb9 +size 199058850 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f3923b4719cd699200a195ec8fa3b50fbd6133c3 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef9112dbaf9496203b42eea8fea5e7de1caf0b559780bbaf38dee2c387ac5b82 +size 199058722 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7eea44150968a9060bad114f4e1c8810f521195b --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b6b8b2fac9a31d893e3774182fec1e9472c1c30078cbf4d811d99ff0e2ff172 +size 199058722 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ff956db8b62a05da8f66f00779298970841717c3 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb47d8ed015ec09fa30b8877552c4777659762c47b06a50e7f43d451e68a8b21 +size 199058658 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cc75cbe630e476a6af91ba0117e8cb4f44e9ce85 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7910b7c7888470312d4bc169adfd549464440f0bf4f28da0bc54b9b2aff4e55a +size 199058658 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..07a295bb288778203dd9a349bd8b36c2bbba9d2a --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6a13a72b34813c4348a2f973daff29f136fb409ef9405ef7d3d9c8feadf67ae8 +size 199058786 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f6070f8a8369ad9061be1af2a971b00663b8eb02 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:043bac9cafd2f95b4147d94c22ea92388695cedd434c249457d4bc3b14207174 +size 199058786 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..47563d13fe23b8019219265d73cf93e93d868baf --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a15f4df425a0dbbe57761a762e03a28f6c1cb3e4dd3b8b44a33e1a7fe72a2a8 +size 199058722 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6fb1fa0f69de61c15347e882db99cea753af0b0b --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:586a4fcc1efeff0974320ad728e5d83d7111eeeee323be9db0525c99ac43c770 +size 199058722 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ba6eb55da41898861d1ad9ecb3c1297b2682fb50 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77701e72d55c17c580d46385d1da71d9f8afd7bed9c78996b95bd2f11adf1d9d +size 199058722 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ea8b6ffaff421032a2f84e37394c088e6e4b08f7 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b2f1e3fc751efe6eac5068531ad36db7fac8d0d67850438a54a8372074e71d95 +size 199058722 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fb675f4a235a64e0c9326d8dfc96df050c7ad279 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb3ac4090d2012b1207c2b8698900e21a7830b313d44e277a1f1c4e754fa4f06 +size 199058722 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3aff75e851bbf04d7e647ae595cc2ae0773719ab --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:842dbfeef2fb3cd9b4e334bf5d53d5bc8489e9be23c8a457084684a4216d04f6 +size 199058722 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..84987f658291a3929c01592e2700abc481453ce5 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:854edfe75c018c1bbaef2a2c8ebb7d64c8f6570fc1d85fe2f67d36f5f94720a4 +size 199058786 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c004a7035d62b5848cce1d72e78bbc297ce43dcc --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1de8ebf118f79732074d3c705044f6424b7b84b56b7c4f9904aa853468b1ac21 +size 199058786 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cccc79255faecb4c15b42cad6e0cd9981b38e8ae --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:519930e3583ceb6e19494c0b6a871971f68dc8d29c28f01c6482af421e126f2c +size 199058658 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9ef32a6a589e0066a6b39315d01e05c2fe55b808 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ffa1d26105f4264af6341682750354d14b2ab35bc75a3c2f8ecc7c972cac59e +size 199058658 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a36ccf28eb03147cca4cb37b0a84a3336471ce8f --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c5e68bde64a5dfd94d0c3ace76096f6e9d1cb079c6008a636a78989d27690a50 +size 199058658 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..33c4285884ccd9e8d95e766fd12efddf831f3b34 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92a24dac37d64de6550ed747dba7df55efb0bf5d18cc7aa8c5216dc9982e1a27 +size 199058658 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f3a5f0894404c7f6a9c5b7ac3cd95e12e68967ec --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:96c1cd172d10e065e65fbcadc5e2d3c360a3feda0dd2621cdcf6b42ec923a3c9 +size 199058839 diff --git a/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dde85c71b1d471028ebea4565c69e3fd6209a4b3 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:715f442aebdc274e737940310f29724cc154be1930591747849323179732b759 +size 199058839 diff --git a/4b284b28bc4seed4/global_step80108/layer_01-model_00-model_states.pt b/4b284b28bc4seed4/global_step80108/layer_01-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7c392b77f10824d30b7f668842329c9eb6df9e1a --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/layer_01-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:114037903892ec8cea8e23d112b6f2326d921188c7e9fe01635561ec96d7ae37 +size 167511299 diff --git a/4b284b28bc4seed4/global_step80108/layer_01-model_01-model_states.pt b/4b284b28bc4seed4/global_step80108/layer_01-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a1491ffa39d6b1e1c0c6af25d688d5f2e17c416a --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/layer_01-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7562bdaa876bc4979871fad23e228ca955d3cae2faf0174351045d55d5d7992 +size 167511299 diff --git a/4b284b28bc4seed4/global_step80108/layer_03-model_00-model_states.pt b/4b284b28bc4seed4/global_step80108/layer_03-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..651dd61caed245fdb472ca3eff7c9a70ce3d43eb --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/layer_03-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f3ce6ff1e1049da01db545681f19ee93d547bd81433e221e8a61ae8fcb843d1a +size 113308931 diff --git a/4b284b28bc4seed4/global_step80108/layer_03-model_01-model_states.pt b/4b284b28bc4seed4/global_step80108/layer_03-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5fb7a4c29a5c1872f3391788235a01295db44c14 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/layer_03-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6a933a6bca361f0fc88ff30281a460de030a8b4dcd1b82b80c904a742cfa530d +size 113308931 diff --git a/4b284b28bc4seed4/global_step80108/layer_04-model_00-model_states.pt b/4b284b28bc4seed4/global_step80108/layer_04-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fc3fa7a6c6c37d0a03214d897d628306d928405f --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/layer_04-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8bf955870f0185104e1eb4a78baef46c6ff19be40233fbab23d8801455377f3f +size 113308931 diff --git a/4b284b28bc4seed4/global_step80108/layer_04-model_01-model_states.pt b/4b284b28bc4seed4/global_step80108/layer_04-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..99ea897e0f8f8d2eb01e837c1d4b5f88d3a496cc --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/layer_04-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6df86c58784a2838a0b4fe6ab71d38a537833adc0423bb43e20ff22e2da4f9a5 +size 113308931 diff --git a/4b284b28bc4seed4/global_step80108/layer_05-model_00-model_states.pt b/4b284b28bc4seed4/global_step80108/layer_05-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7833b3e48c9ac9f504713de5d20661bc94d87800 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/layer_05-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b40d7fc220f5131ec640299fb5c475885760cdc03958151ad9a3eae9645ae98b +size 113308931 diff --git a/4b284b28bc4seed4/global_step80108/layer_05-model_01-model_states.pt b/4b284b28bc4seed4/global_step80108/layer_05-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ecfb4015fda9a9699cd4ae0e761e9d388fede59c --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/layer_05-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0aa8dc947f4e02c359f522625550d4eaa4dba5ee2dd07b17933c86349a9236e2 +size 113308931 diff --git a/4b284b28bc4seed4/global_step80108/layer_06-model_00-model_states.pt b/4b284b28bc4seed4/global_step80108/layer_06-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2fb8635b75578fa0c2ab3c3f239d6fa7488b9156 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/layer_06-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5fd31ee9d8ccd5523614681b8b888e70af599b42db514da86b6d74575f0314c6 +size 113308931 diff --git a/4b284b28bc4seed4/global_step80108/layer_06-model_01-model_states.pt b/4b284b28bc4seed4/global_step80108/layer_06-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8c76e1561f103f8e25107feef857ed695e8be4f2 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/layer_06-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1eb9f6a6f4a70a0c60a8a7ef9afdb4e3db47e83b8c7563198f2f8eb39ca12fa7 +size 113308931 diff --git a/4b284b28bc4seed4/global_step80108/layer_07-model_00-model_states.pt b/4b284b28bc4seed4/global_step80108/layer_07-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f81501a1687a631fd32e456a3cf8eb7865e7e5c4 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/layer_07-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6af2757d6f6fd69bdeac2a41a73a64fc0c498ea5acbff354266103e1fa9804a5 +size 113308931 diff --git a/4b284b28bc4seed4/global_step80108/layer_07-model_01-model_states.pt b/4b284b28bc4seed4/global_step80108/layer_07-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..69c271eae80a52742f6472b1cfdacf368d8542b2 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/layer_07-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c51c3de7bcd4bab31ddee8a6595f3cc62a84052ad9eae0bfc5ad7a5c2719ca4f +size 113308931 diff --git a/4b284b28bc4seed4/global_step80108/layer_08-model_00-model_states.pt b/4b284b28bc4seed4/global_step80108/layer_08-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2a31d6deff71d1cc10e1d7706b81c6bcba0df63b --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/layer_08-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:57b20da6054f966037794fc65f071c635d77c1cc0d49848507762699427f9a44 +size 113308931 diff --git a/4b284b28bc4seed4/global_step80108/layer_08-model_01-model_states.pt b/4b284b28bc4seed4/global_step80108/layer_08-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..178d13ace17728697c850e6e153f2c921104bdf8 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/layer_08-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9af54387fdcf37cf5d531bfaa00c93c40fa846fe23dc208196cf00a6cdc14e67 +size 113308931 diff --git a/4b284b28bc4seed4/global_step80108/layer_09-model_00-model_states.pt b/4b284b28bc4seed4/global_step80108/layer_09-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d3ba9f739f0aa563c9ddf9ed15187288873520cb --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/layer_09-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a2afc404e55ea35b2d918080a16144ab9599150d88c12b9220c9a84608b1ab39 +size 113308931 diff --git a/4b284b28bc4seed4/global_step80108/layer_09-model_01-model_states.pt b/4b284b28bc4seed4/global_step80108/layer_09-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3df6370afeb84e80084533b13b9f158161ba5c2a --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/layer_09-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f3732b21d3496a1bea6dd18c5a3e7dff5c8e07c1d83f6a24e5ccc2adf61b089 +size 113308931 diff --git a/4b284b28bc4seed4/global_step80108/layer_10-model_00-model_states.pt b/4b284b28bc4seed4/global_step80108/layer_10-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5f6bced92bce6a949309aacb043192d1f0451958 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/layer_10-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7dcdac9a6017aa51f6e920e7d418b584e2da24710fe0f0db6ba6b8f908d932d +size 113308931 diff --git a/4b284b28bc4seed4/global_step80108/layer_10-model_01-model_states.pt b/4b284b28bc4seed4/global_step80108/layer_10-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6cb7c4fff6828ec69f801cc10a0ee98cbd6cd413 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/layer_10-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1922d9699c03366852bfe62b81d3603e5a2082bd2fd581c34e0b302f569f920b +size 113308931 diff --git a/4b284b28bc4seed4/global_step80108/layer_11-model_00-model_states.pt b/4b284b28bc4seed4/global_step80108/layer_11-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3b0e7a13ff8f6801a9976b3489fab36d531dd260 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/layer_11-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e29de2863d05270fa2fc8afe41e839fed7dd043d67edd180640b6f95c7df736 +size 113308931 diff --git a/4b284b28bc4seed4/global_step80108/layer_11-model_01-model_states.pt b/4b284b28bc4seed4/global_step80108/layer_11-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c19416220295b80bc797d28328f4b2bf9a9ba83f --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/layer_11-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:caf56c195c0065fd3bc9db126acff37dcde8f8686bc74d17fa351f4b5681c134 +size 113308931 diff --git a/4b284b28bc4seed4/global_step80108/layer_12-model_00-model_states.pt b/4b284b28bc4seed4/global_step80108/layer_12-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1b516783e8ba4963ff7b18227958f0ec82767b3e --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/layer_12-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df2c80ea2f9c139257ed3cd40b1efc5a084afadf52922ef3190ee49498d4614a +size 113308931 diff --git a/4b284b28bc4seed4/global_step80108/layer_12-model_01-model_states.pt b/4b284b28bc4seed4/global_step80108/layer_12-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..70a16fdd3dbda45ab68bdf87914645193510d8e0 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/layer_12-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cba783da9ec4d1ab7ebf4fa2c1d39fb8541f0a0ca1feb9fb8926ebc370c62237 +size 113308931 diff --git a/4b284b28bc4seed4/global_step80108/layer_13-model_00-model_states.pt b/4b284b28bc4seed4/global_step80108/layer_13-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d3237265b73dbec2b1ed12c9166bfeac94e52997 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/layer_13-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9983360eb9725db4b46de0806fd3b7bea84efde40672eab50f62fcf50a60e629 +size 113308931 diff --git a/4b284b28bc4seed4/global_step80108/layer_13-model_01-model_states.pt b/4b284b28bc4seed4/global_step80108/layer_13-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..de01ed6f29676fd91126b40d1914a6b87df4a775 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/layer_13-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:68f2a0057516462b8efef766c2b9a1c156b56f2e5db616b5210ac9e956ed1f0a +size 113308931 diff --git a/4b284b28bc4seed4/global_step80108/layer_14-model_00-model_states.pt b/4b284b28bc4seed4/global_step80108/layer_14-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c8427df7e7f64086afb9ddaf4fdcc0a7112ea1d4 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/layer_14-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd3e8679df5b0088400867d0c347619a0ddd7aa28cd6e60e99fac0527b35ede4 +size 113308931 diff --git a/4b284b28bc4seed4/global_step80108/layer_14-model_01-model_states.pt b/4b284b28bc4seed4/global_step80108/layer_14-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d41cc049b377d4f2fd1c617dc5f10d36ef04ed0a --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/layer_14-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e265536946261154a7746ce651b896b5397be7e32e250f1bfc4197fe02d64eb +size 113308931 diff --git a/4b284b28bc4seed4/global_step80108/layer_15-model_00-model_states.pt b/4b284b28bc4seed4/global_step80108/layer_15-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d380e0557bbcb58bdd3f82fc816886c4c85ba785 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/layer_15-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:876c5820768eafa02e3a3b47cd0ac4689110d4162f62d397a36aceedc2a98f7c +size 113308931 diff --git a/4b284b28bc4seed4/global_step80108/layer_15-model_01-model_states.pt b/4b284b28bc4seed4/global_step80108/layer_15-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e7bda280f561b0983ba7ea4e66f4755b5b9b8eb7 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/layer_15-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4132272101e09553a79b1524867288f9287f35d419c13a2cdaf66d2b81fbe230 +size 113308931 diff --git a/4b284b28bc4seed4/global_step80108/layer_16-model_00-model_states.pt b/4b284b28bc4seed4/global_step80108/layer_16-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dda36769b2d5f860dc1d9a195a00c6f9f263fc09 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/layer_16-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bea5305e3bf4a69f8e6c786443dd2f7f5043c4afc7acd6762dce7cc36df57a13 +size 113308931 diff --git a/4b284b28bc4seed4/global_step80108/layer_16-model_01-model_states.pt b/4b284b28bc4seed4/global_step80108/layer_16-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f00a80829ad3b0f2aa3946d4225c44d1cb2249b7 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/layer_16-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d17713c72ba8ffee275fef0dcbc82450da122e022692572a94a13c83aea5b28 +size 113308931 diff --git a/4b284b28bc4seed4/global_step80108/layer_17-model_00-model_states.pt b/4b284b28bc4seed4/global_step80108/layer_17-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..afc1526e3a0c29026d4cd8fde86e8f027540d619 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/layer_17-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b5e3009b5846c55f4811c99eb92cf31a809e5004ef201f7cbf378ace76344a3 +size 113308931 diff --git a/4b284b28bc4seed4/global_step80108/layer_17-model_01-model_states.pt b/4b284b28bc4seed4/global_step80108/layer_17-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b9dd27a50b81271db2f1c7ee00717f5d6b2c8c30 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/layer_17-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:544fb296738a2429cca387d573ae39d9ce829adc681fdf4aacb8589145f258db +size 113308931 diff --git a/4b284b28bc4seed4/global_step80108/layer_18-model_00-model_states.pt b/4b284b28bc4seed4/global_step80108/layer_18-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..69a1c3c774350574938ee6995142c77ef84e65ae --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/layer_18-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec8c433c13082d6eb7e310e3e9b2e92abc80dbc4d80e6062988c75eae87ae7fc +size 113308931 diff --git a/4b284b28bc4seed4/global_step80108/layer_18-model_01-model_states.pt b/4b284b28bc4seed4/global_step80108/layer_18-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dfb6e53abec85dd5820302aa48aea84fee279ce4 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/layer_18-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b94aa4693659a3898a2ed712a3919a6b1fbcae973a6e949262a364dd0093a08c +size 113308931 diff --git a/4b284b28bc4seed4/global_step80108/layer_19-model_00-model_states.pt b/4b284b28bc4seed4/global_step80108/layer_19-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fa47f9d4f87fa8e3cc70ea798d8715e9c6cf67c6 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/layer_19-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:47a3c1f2d4107d565477ffd69efefd3b1d0481edd4426fc2afdf336fd68e12c4 +size 113308931 diff --git a/4b284b28bc4seed4/global_step80108/layer_19-model_01-model_states.pt b/4b284b28bc4seed4/global_step80108/layer_19-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0aced3d5384629adfe289ee2f631e8a98838d6b0 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/layer_19-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b6368f2337f54ab55d3ad1e41ca769de184f6eb9c782244a8dcc1d9b06eb691 +size 113308931 diff --git a/4b284b28bc4seed4/global_step80108/layer_20-model_00-model_states.pt b/4b284b28bc4seed4/global_step80108/layer_20-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1ffdbf91b512704996a2e2c97b5f29b3696c4930 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/layer_20-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac0803792359d57fce07b5a267b9484eb38946d5b2818c27ded5a5c01d709512 +size 113308931 diff --git a/4b284b28bc4seed4/global_step80108/layer_20-model_01-model_states.pt b/4b284b28bc4seed4/global_step80108/layer_20-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..47231ca0dde2e3bb576cbc7fabeb434b9f8bdcfa --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/layer_20-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dbf9c99ef325d0b7343d518519a08bf1bc775079e6f8488e579406546992c962 +size 113308931 diff --git a/4b284b28bc4seed4/global_step80108/layer_21-model_00-model_states.pt b/4b284b28bc4seed4/global_step80108/layer_21-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..857637f947a60c7f9ffec67e856a5ec895a2ca86 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/layer_21-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee196b9eaf479db36be21edea82d4dd20dc4546c5e0343c0968f3c010453d02e +size 113308931 diff --git a/4b284b28bc4seed4/global_step80108/layer_21-model_01-model_states.pt b/4b284b28bc4seed4/global_step80108/layer_21-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c60616cab4c2e347ac6e08d4df5f8736d3a9603b --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/layer_21-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:41937ef3d7041160b806185f4b6b1d3f5b45a2cffda867ab90d57077ced2d2af +size 113308931 diff --git a/4b284b28bc4seed4/global_step80108/layer_22-model_00-model_states.pt b/4b284b28bc4seed4/global_step80108/layer_22-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ce2c2aae6aab6c812025b68d35ff044f1592c742 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/layer_22-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ac5ac5c90f401dfc144815f330105c596df6834cc5d85df1ddfb5acf0cca4cd +size 113308931 diff --git a/4b284b28bc4seed4/global_step80108/layer_22-model_01-model_states.pt b/4b284b28bc4seed4/global_step80108/layer_22-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fd61c72081658a368599fc00c6a1af81d4d1ff12 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/layer_22-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:42edd6e9998185d3333b4892eb4654deb231ec2816bbf7e073619d00a9747927 +size 113308931 diff --git a/4b284b28bc4seed4/global_step80108/layer_23-model_00-model_states.pt b/4b284b28bc4seed4/global_step80108/layer_23-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..70cb1d19f5c5a1562375f33210e03d8680ec79c6 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/layer_23-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4001cc0a922e73d6da513e1de1c58053b7bb24b6835e3b336df1e08334c197cd +size 113308931 diff --git a/4b284b28bc4seed4/global_step80108/layer_23-model_01-model_states.pt b/4b284b28bc4seed4/global_step80108/layer_23-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..035fbbef600f9ba699a79a6fb837b3bb485abbec --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/layer_23-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:994b39a8f6f7813e3698865bab75ff994f61a4ee1b2e4f32ce5b63e969866c29 +size 113308931 diff --git a/4b284b28bc4seed4/global_step80108/layer_24-model_00-model_states.pt b/4b284b28bc4seed4/global_step80108/layer_24-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9b36ba95b5f02cba27cf23bdc1076978f45a515c --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/layer_24-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9dc7d2bb2fc0a7958dffb3ed4e6100b063c2dd3d59ca36f41dc2f31c1580cc6e +size 113308931 diff --git a/4b284b28bc4seed4/global_step80108/layer_24-model_01-model_states.pt b/4b284b28bc4seed4/global_step80108/layer_24-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5798944f3344d2c6510d6503946dc407c54f0940 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/layer_24-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c4387371b2ab78a16129a38bb665ec1e4fa9f846da8ab1f066c9a1e4efd5cc07 +size 113308931 diff --git a/4b284b28bc4seed4/global_step80108/layer_25-model_00-model_states.pt b/4b284b28bc4seed4/global_step80108/layer_25-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4cc0193eabb6a29765a097c500be6f4d1f6f38f9 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/layer_25-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dbff909e0b8820a87fdee9d5b10090c2f77404d92e529d89881b1e5719f32bc3 +size 113308931 diff --git a/4b284b28bc4seed4/global_step80108/layer_25-model_01-model_states.pt b/4b284b28bc4seed4/global_step80108/layer_25-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..23f7aecd3fb8b19ce78c9ba399ae97d0fffd721e --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/layer_25-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:450aa17f5be7e1d55a56ff353b111b2f12ec6f72f54af0e653c8bf228854bdfb +size 113308931 diff --git a/4b284b28bc4seed4/global_step80108/layer_26-model_00-model_states.pt b/4b284b28bc4seed4/global_step80108/layer_26-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5a7c32770ffd97c30acda28875aed9be3aa8e56f --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/layer_26-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e0e503b9e6c1860e069c490694bfc9611de21168f9e950bf81c5be544d74e427 +size 113308931 diff --git a/4b284b28bc4seed4/global_step80108/layer_26-model_01-model_states.pt b/4b284b28bc4seed4/global_step80108/layer_26-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..efd127aff980de44a2b0774776d085e9ba1f9e6b --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/layer_26-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c41b66e8626951c866100ada9ec1bc7c3b844f862d69aa6597c8a59a2b6c7698 +size 113308931 diff --git a/4b284b28bc4seed4/global_step80108/layer_27-model_00-model_states.pt b/4b284b28bc4seed4/global_step80108/layer_27-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..011438aaa45138fe9187dcefb1c2fd23ee9140c6 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/layer_27-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d1c70ce57b71fc852963d5bf9593ad1bfcad3c89fc434f335ec0d08efa7a00a +size 113308931 diff --git a/4b284b28bc4seed4/global_step80108/layer_27-model_01-model_states.pt b/4b284b28bc4seed4/global_step80108/layer_27-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..81aa2ee738632ef787213df7f79afd65543e80f3 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/layer_27-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd9267d84ff556253ab757f63e5876a2fb386e92a5091a09f387d31e187ce69a +size 113308931 diff --git a/4b284b28bc4seed4/global_step80108/layer_28-model_00-model_states.pt b/4b284b28bc4seed4/global_step80108/layer_28-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1e32da0f8e86ab022dd9614c2e1ccc654cdf4c09 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/layer_28-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46ea92b17f5e917fb2a153aab09350382cebefc8cc6258ecea4ee932178cea06 +size 113308931 diff --git a/4b284b28bc4seed4/global_step80108/layer_28-model_01-model_states.pt b/4b284b28bc4seed4/global_step80108/layer_28-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0ffc821d5dc67d785be67a4445f097c28cc740a5 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/layer_28-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4af41b1a9a3866ace2d35dcc49dce5b0af282be72039d832650fd47fea681b8a +size 113308931 diff --git a/4b284b28bc4seed4/global_step80108/layer_29-model_00-model_states.pt b/4b284b28bc4seed4/global_step80108/layer_29-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2056cf8351ad65e6fab2b0885367b08e828cc6a6 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/layer_29-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e2a8065174d11ec60294b92949429a8963eac591757456de1922668b840780b +size 113308931 diff --git a/4b284b28bc4seed4/global_step80108/layer_29-model_01-model_states.pt b/4b284b28bc4seed4/global_step80108/layer_29-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d1aba1eb4dda1974e7d07653f913b5967138310e --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/layer_29-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:50ad6420b13a9109d8dd8bbc98a416a55d171eecdde82422e2c2b3c595910d61 +size 113308931 diff --git a/4b284b28bc4seed4/global_step80108/layer_30-model_00-model_states.pt b/4b284b28bc4seed4/global_step80108/layer_30-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..19c4bad4d7c509937c09efde68de52e30f28015c --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/layer_30-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b695b03286f1978d001f3ca48fa425d69d9e4275d9cb880e356f7b9766616c1 +size 113308931 diff --git a/4b284b28bc4seed4/global_step80108/layer_30-model_01-model_states.pt b/4b284b28bc4seed4/global_step80108/layer_30-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b9e2cfb5d24e29ac58eea351e22519fbc5535e87 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/layer_30-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:319a1151f9340d8670f2c915450ecbf03cbc386f58cef25800ea70a51e1c3fba +size 113308931 diff --git a/4b284b28bc4seed4/global_step80108/layer_31-model_00-model_states.pt b/4b284b28bc4seed4/global_step80108/layer_31-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8a4075cf61ff3c65eac5461953599e6d09b8b12a --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/layer_31-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9130872c24085ae2f74fb09df290c63296f13fe1fddb8b164c66b4276eccfa81 +size 113308931 diff --git a/4b284b28bc4seed4/global_step80108/layer_31-model_01-model_states.pt b/4b284b28bc4seed4/global_step80108/layer_31-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..73f129a9f66d7d03fd9fcbfef14316e34c4252ec --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/layer_31-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:649eb9d351a19db46c3c1199adff97e85e42e473d8ee8ea695566e85d3ccd1e8 +size 113308931 diff --git a/4b284b28bc4seed4/global_step80108/layer_32-model_00-model_states.pt b/4b284b28bc4seed4/global_step80108/layer_32-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..18321f143f7877ac0491f79f4f2584e48e7bbb8e --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/layer_32-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:24c2d9fd4dd83103970d247e417be8d02eefe00cd2817bb36cfa45d99d0a2e94 +size 113308931 diff --git a/4b284b28bc4seed4/global_step80108/layer_32-model_01-model_states.pt b/4b284b28bc4seed4/global_step80108/layer_32-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..85de10fc13953206860a4b9b442a9c7fae1ad2a3 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/layer_32-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3facdc21c7202b74e46bfd515f046de9dfc160a99c80300d041ecb5d41d66d4 +size 113308931 diff --git a/4b284b28bc4seed4/global_step80108/layer_33-model_00-model_states.pt b/4b284b28bc4seed4/global_step80108/layer_33-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b793846e74288d0deb7e9970ac47d725f7813094 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/layer_33-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:102436e4a93a94b881d6a3eb112cd6b4bd4e63b0f3673028033a53979897ae01 +size 113308931 diff --git a/4b284b28bc4seed4/global_step80108/layer_33-model_01-model_states.pt b/4b284b28bc4seed4/global_step80108/layer_33-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..74551f94d62ce71f3238a473cf719b27458f046d --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/layer_33-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4754e04f84b4a214c6148bd539a581312c13077a0033ccaf7e0b66c6aa01e26d +size 113308931 diff --git a/4b284b28bc4seed4/global_step80108/layer_34-model_00-model_states.pt b/4b284b28bc4seed4/global_step80108/layer_34-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..59a8b3c97cc4ced4b142d00910591bfe8beba306 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/layer_34-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d47186165fc70de02f01a88a45c305cbd6a0b52102fe2d96c16aab6aaa9040e +size 113308931 diff --git a/4b284b28bc4seed4/global_step80108/layer_34-model_01-model_states.pt b/4b284b28bc4seed4/global_step80108/layer_34-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9657e70b97e7cd8f48b7235f24215cada194f92a --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/layer_34-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bfb2a28d12a16b627972ca8f81e9a0b255d3d28ef9241f9c667c9bc8db35bb4e +size 113308931 diff --git a/4b284b28bc4seed4/global_step80108/layer_35-model_00-model_states.pt b/4b284b28bc4seed4/global_step80108/layer_35-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3fda84aa7b6d50b4a7e15b864eccf789cfe8db42 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/layer_35-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c28e4d5bc389f65c4104da413fee87c7985eafe9ecabc552bcd75881a4767f2f +size 113308931 diff --git a/4b284b28bc4seed4/global_step80108/layer_35-model_01-model_states.pt b/4b284b28bc4seed4/global_step80108/layer_35-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..04b6b4be40578410dd17c22cbadf98ffe4387a1f --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/layer_35-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:70a2aa3d2b8472076375e064e84e8778fb020e465ee10058657a4221bc9d041a +size 113308931 diff --git a/4b284b28bc4seed4/global_step80108/layer_36-model_00-model_states.pt b/4b284b28bc4seed4/global_step80108/layer_36-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fe8f505e939472b1895ca7aeff780d6bb46882f1 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/layer_36-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b81fe232c0f1fe799c8016e358f867c03b2b8d50d4df6a09a67f09780935377 +size 113308931 diff --git a/4b284b28bc4seed4/global_step80108/layer_36-model_01-model_states.pt b/4b284b28bc4seed4/global_step80108/layer_36-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..977f333667a17b02b013974eeefecce9c354fa45 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/layer_36-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a580f7d6c31aaef106e3ef39791df52e7a893a95d25dce2b606f6aa1c411446b +size 113308931 diff --git a/4b284b28bc4seed4/global_step80108/layer_37-model_00-model_states.pt b/4b284b28bc4seed4/global_step80108/layer_37-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..eaac6a1fcc5159cea6ab1eb9e53af9f6c2d6296c --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/layer_37-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:80257a11bbcb9493f5d3793c232f53c80ace8c98b4e9257668e37c1c73703bf0 +size 113308931 diff --git a/4b284b28bc4seed4/global_step80108/layer_37-model_01-model_states.pt b/4b284b28bc4seed4/global_step80108/layer_37-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2fd55a241a1aa76a4356749cbdd3627e70d688b6 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/layer_37-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:532905908dbe68b014c5980b2f55409602e80ddd4fdd99c75e08ef7e94542f68 +size 113308931 diff --git a/4b284b28bc4seed4/global_step80108/layer_38-model_00-model_states.pt b/4b284b28bc4seed4/global_step80108/layer_38-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b2a7314d19ce4385435f0e4fbe04f0ebc16284a5 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/layer_38-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fca18b97dafbf9ae75125c5d1aa2a6733e65687dc4c1e5d7cad4ab9e6e76ebbc +size 113308931 diff --git a/4b284b28bc4seed4/global_step80108/layer_38-model_01-model_states.pt b/4b284b28bc4seed4/global_step80108/layer_38-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b01f12e017198047fa72080ac1962b6cb57bbe97 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/layer_38-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d05276d265806b286cafbee1ca2c9a4155d7131fea754d22f6dbecf3e84294b +size 113308931 diff --git a/4b284b28bc4seed4/global_step80108/layer_40-model_00-model_states.pt b/4b284b28bc4seed4/global_step80108/layer_40-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..72de28bd58bfc241f7aa3cebc9ef05be301e63f7 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/layer_40-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:55fb988b9a344b470f311aa490830ce6c6a119a674b8ca2d2fca300005fbfbd0 +size 13507 diff --git a/4b284b28bc4seed4/global_step80108/layer_40-model_01-model_states.pt b/4b284b28bc4seed4/global_step80108/layer_40-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..61f35ad8221a534946d19033e0ba68c1862c9138 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/layer_40-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:12931461186370c8c30133ee5ff8c66f51968ecf371d8b41ef3eb1b40f366d5d +size 13507 diff --git a/4b284b28bc4seed4/global_step80108/mp_rank_00_model_states.pt b/4b284b28bc4seed4/global_step80108/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..35f08a226199bad1ba694947d333e568fdc863be --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64d7c963ecfbb831d714a0f528e8942967c34ba3015ca82d241617c2c2faa02e +size 51443 diff --git a/4b284b28bc4seed4/global_step80108/mp_rank_01_model_states.pt b/4b284b28bc4seed4/global_step80108/mp_rank_01_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..65cfb3520f7257ecbe84d6298600a53db4608571 --- /dev/null +++ b/4b284b28bc4seed4/global_step80108/mp_rank_01_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a37995ccfd443e7a9e13b79c90ad3cb5440412da405810093e89b4093c2dba75 +size 51443 diff --git a/4b284b28bc4seed4/transformers/config.json b/4b284b28bc4seed4/transformers/config.json new file mode 100644 index 0000000000000000000000000000000000000000..df814c3a71ee49044410636b5eeb4f43611690ba --- /dev/null +++ b/4b284b28bc4seed4/transformers/config.json @@ -0,0 +1 @@ +{"vocab_size": 50432, "n_positions": 2048, "n_embd": 3072, "n_layer": 36, "n_head": 24, "n_inner": 12288, "activation_function": "gelu", "resid_pdrop": 0.1, "embd_pdrop": 0.1, "attn_pdrop": 0.1, "layer_norm_epsilon": 1e-05, "initializer_range": 0.02, "summary_type": "cls_index", "summary_use_proj": true, "summary_activation": null, "summary_first_dropout": 0.1, "summary_proj_to_labels": true, "scale_attn_weights": true, "use_cache": true, "scale_attn_by_inverse_layer_idx": false, "reorder_and_upcast_attn": false, "bos_token_id": 50256, "eos_token_id": 50256, "return_dict": true, "output_hidden_states": false, "output_attentions": false, "torchscript": false, "torch_dtype": null, "use_bfloat16": false, "tf_legacy_loss": false, "pruned_heads": {}, "tie_word_embeddings": true, "is_encoder_decoder": false, "is_decoder": false, "cross_attention_hidden_size": null, "add_cross_attention": false, "tie_encoder_decoder": false, "max_length": 20, "min_length": 0, "do_sample": false, "early_stopping": false, "num_beams": 1, "num_beam_groups": 1, "diversity_penalty": 0.0, "temperature": 1.0, "top_k": 50, "top_p": 1.0, "typical_p": 1.0, "repetition_penalty": 1.0, "length_penalty": 1.0, "no_repeat_ngram_size": 0, "encoder_no_repeat_ngram_size": 0, "bad_words_ids": null, "num_return_sequences": 1, "chunk_size_feed_forward": 0, "output_scores": false, "return_dict_in_generate": false, "forced_bos_token_id": null, "forced_eos_token_id": null, "remove_invalid_values": false, "exponential_decay_length_penalty": null, "suppress_tokens": null, "begin_suppress_tokens": null, "architectures": ["GPT2LMHeadModel"], "finetuning_task": null, "id2label": {"0": "LABEL_0", "1": "LABEL_1"}, "label2id": {"LABEL_0": 0, "LABEL_1": 1}, "tokenizer_class": null, "prefix": null, "pad_token_id": null, "sep_token_id": null, "decoder_start_token_id": null, "task_specific_params": null, "problem_type": null, "_name_or_path": "", "transformers_version": "4.25.0.dev0", "n_ctx": 1024, "gradient_checkpointing": false, "model_type": "gpt2"} \ No newline at end of file diff --git a/4b284b28bc4seed4/transformers/pytorch_model.bin b/4b284b28bc4seed4/transformers/pytorch_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..bd6f4da2b6a26608c470bce0a960f8a449feefd4 --- /dev/null +++ b/4b284b28bc4seed4/transformers/pytorch_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cde7d83be3c242b4b8007eb7a67f19e5b13a0e14ea93f2f269efbfdddffb84c1 +size 8781203669